environments ai ml automl dnn gpu - Azure/azureml-assets GitHub Wiki
An environment used by Azure ML AutoML for training models.
Version: 44
OS : Ubuntu20.04 Training Preview OpenMpi : 4.1.0 Python : 3.9
View in Studio: https://ml.azure.com/registries/azureml/environments/ai-ml-automl-dnn-gpu/version/44
Docker image: mcr.microsoft.com/azureml/curated/ai-ml-automl-dnn-gpu:44
FROM mcr.microsoft.com/azureml/openmpi5.0-cuda12.4-ubuntu22.04:20260315.v1
USER root
ENV AZUREML_CONDA_ENVIRONMENT_PATH=/azureml-envs/azureml-automl-dnn-gpu
# Prepend path to AzureML conda environment
ENV PATH=$AZUREML_CONDA_ENVIRONMENT_PATH/bin:$PATH
COPY --from=mcr.microsoft.com/azureml/mlflow-ubuntu20.04-py38-cpu-inference:20250506.v1 /var/mlflow_resources/ /var/mlflow_resources/
ENV MLFLOW_MODEL_FOLDER="mlflow-model"
# ENV AML_APP_ROOT="/var/mlflow_resources"
# ENV AZUREML_ENTRY_SCRIPT="mlflow_score_script.py"
ENV ENABLE_METADATA=true
RUN mkdir -p /etc/OpenCL/vendors && echo "libnvidia-opencl.so.1" > /etc/OpenCL/vendors/nvidia.icd
RUN apt-get update && \
apt-get install -y --no-install-recommends \
cmake \
libboost-dev \
libboost-system-dev \
libboost-filesystem-dev && \
apt-get clean && rm -rf /var/lib/apt/lists/*
RUN conda create -p $AZUREML_CONDA_ENVIRONMENT_PATH python=3.10 pip=26.0 -y
###############################
# Pre-Build LightGBM
###############################
RUN pip install --upgrade lightgbm==4.6.0
###############################
# Install GPU LightGBM and XgBoost
###############################
RUN pip install --upgrade --force-reinstall xgboost==1.5.2 pandas==1.5.3
# begin conda create
# Install ncurses via conda (C library, not available on pip; single-package solve is trivial)
RUN conda install -p $AZUREML_CONDA_ENVIRONMENT_PATH \
ncurses=6.5 \
-c conda-forge -y
# Install packages via pip (avoids conda solver OOM)
RUN pip install --no-cache-dir \
'numpy>=1.23.5,<1.24' \
'scikit-learn==1.5.1' \
'holidays==0.29' \
'setuptools-git' \
'wheel>=0.46.2' \
'scipy==1.10.1' \
'joblib==1.2.0'
# Ensure future conda and pip calls are tied to this conda environment,
# and we don't just get lucky from the implicit PATH ordering.
SHELL ["conda", "run", "-p", "$AZUREML_CONDA_ENVIRONMENT_PATH", "/bin/bash", "-c"]
# end conda create
# begin pip install
# Install pip dependencies
RUN pip install \
# begin pypi dependencies
azureml-core==1.61.0.post3 \
azureml-pipeline-core==1.62.0 \
azureml-telemetry==1.62.0 \
azureml-defaults==1.62.0 \
azureml-interpret==1.62.0 \
azureml-responsibleai==1.62.0 \
azureml-automl-core==1.62.0 \
azureml-automl-runtime==1.62.0 \
azureml-train-automl-client==1.62.0 \
azureml-train-automl-runtime==1.62.0 \
azureml-dataset-runtime==1.62.0 \
azureml-mlflow==1.62.0.post1 \
'azureml-model-management-sdk==1.0.1b6.post1' \
'mlflow-skinny==2.15.1' \
'azure-identity>=1.25.1' --no-cache-dir
RUN pip install \
'inference-schema' \
'cmdstanpy==1.0.4' \
'prophet==1.1.4' \
'pytorch-transformers==1.0.0' --no-cache-dir
RUN pip install \
'spacy==3.7.4' \
'https://aka.ms/automl-resources/packages/en_core_web_sm-3.7.1.tar.gz' \
'py-cpuinfo==5.0.0' \
'jinja2>=3.1.6' --no-cache-dir
# end pypi dependencies
# Fix vulnerabilities - overrides needed because parent packages cap vulnerable versions
# torchvision==0.23.0, torch==2.8.0: CVE-2025-32434 RCE via torch.load (via pytorch-transformers -> torch, horovod)
# distributed>=2026.1.0: CVE-2026-23528 (via azureml-train-automl-runtime -> dask[complete] -> distributed)
# mlflow-skinny>=2.16.0: security fixes (via azureml-mlflow -> mlflow-skinny, also installed directly)
# protobuf>=5.29.6: CVE-2026-0994 DoS recursion (via mlflow-skinny -> protobuf, azureml-automl-runtime -> onnx/onnxruntime)
# pillow>=12.1.1: CVE-2026-25990 heap buffer overflow (via torchvision -> pillow, prophet -> matplotlib -> pillow)
# tornado>=6.5.5: GHSA-78cv-mqj4-43f7 DoS (via distributed -> tornado, bokeh -> tornado)
# bokeh>=3.8.2: GHSA-793v-589g-574v CSWSH (overrides azureml-train-automl-runtime's bokeh<3.0.0 cap)
# Note: cryptography, setuptools, jaraco.context overrides removed — verified not needed (base image resolves safe versions)
RUN pip install --upgrade torchvision==0.23.0 torch==2.8.0 --no-cache-dir
RUN pip install --upgrade 'distributed>=2026.1.0' 'mlflow-skinny>=2.16.0' \
'protobuf>=5.29.6' 'pillow>=12.1.1' 'tornado>=6.5.5' 'bokeh>=3.8.2'
# --- End Vulnerability Fixes ---
RUN /bin/bash -c "source activate $AZUREML_CONDA_ENVIRONMENT_PATH && \
export CUDACXX=/usr/local/cuda/bin/nvcc && \
export HOROVOD_BUILD_CUDA_CC_LIST='60,61,70,75,80,86,89,90' && \
HOROVOD_WITH_PYTORCH=1 \
HOROVOD_CUDA_HOME=/usr/local/cuda \
CMAKE_LIBRARY_PATH=/usr/local/cuda/targets/x86_64-linux/lib:/usr/local/cuda-12.6/targets/x86_64-linux/lib \
pip install --no-cache-dir --no-build-isolation \
git+https://github.com/horovod/horovod@3a31d933a13c7c885b8a673f4172b17914ad334d"
RUN rm -rf /opt/miniconda/pkgs/
ENV LD_LIBRARY_PATH=$AZUREML_CONDA_ENVIRONMENT_PATH/lib:$LD_LIBRARY_PATH