environments acft group relative policy optimization - Azure/azureml-assets GitHub Wiki
Environment used by the Group Relative Policy Optimization component.
Version: 15
Preview
View in Studio: https://ml.azure.com/registries/azureml/environments/acft-group-relative-policy-optimization/version/15
Docker image: mcr.microsoft.com/azureml/curated/acft-group-relative-policy-optimization:15
# PTCA base image (Ubuntu 22.04, CUDA 12.6, Python 3.10, torch 2.8.0 per the image tag).
FROM mcr.microsoft.com/aifx/acpt/stable-ubuntu2204-cu126-py310-torch280:biweekly.202603.1

# Run the following build steps as root.
USER root

# Refresh the package index, apply pending OS package upgrades, then remove
# apt's caches and package lists within the same layer.
RUN apt-get update \
    && apt-get -y upgrade \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*
# Install the environment's Python dependencies listed in requirements.txt.
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

# Pinned packages installed on top of requirements.txt, one step each and in
# this order; transformers comes last, so 4.56.0 is the version left installed.
# --no-cache-dir keeps pip's download/wheel cache out of every layer (deleting
# the cache in a later layer would not reduce the size of these layers).
RUN pip install --no-cache-dir azureml-evaluate-mlflow==0.0.87
RUN pip install --no-cache-dir azureml-acft-common-components==0.0.87
RUN pip install --no-cache-dir transformers==4.56.0
# Upgrade pip, wheel, setuptools and several transitive dependencies to pinned
# versions in order to fix reported vulnerabilities.
# NOTE(review): the previous comment here stated that protobuf (a transitive
# dependency of vllm) "cannot" be forced to 6.33.5 because the parent only
# declares loose version floors, yet protobuf==6.33.5 is pinned below.
# Confirm the pin resolves cleanly against vllm and update this note.
# --no-cache-dir keeps pip's cache out of the layer.
RUN pip install --no-cache-dir --upgrade \
    azure-core==1.38.0 \
    cryptography==46.0.5 \
    pip==26.0 \
    protobuf==6.33.5 \
    pyasn1==0.6.2 \
    python-multipart==0.0.22 \
    setuptools==82.0.0 \
    urllib3==2.6.3 \
    wheel==0.46.2
# Remove the current user's pip cache directory so that no cached packages
# remain in the final filesystem. (Only the pip cache is removed here.)
RUN rm -rf ~/.cache/pip

# Fix vulnerabilities in the conda "base" environment by upgrading the affected
# packages to pinned versions with that environment's own pip.
# --no-cache-dir prevents this step from re-creating the pip cache that was
# removed in the step above.
RUN conda run -n base python -m pip install --no-cache-dir --upgrade \
    aiohttp==3.13.3 \
    cryptography==46.0.5 \
    pip==26.0 \
    PyNaCl==1.6.2 \
    setuptools==82.0.0 \
    urllib3==2.6.3 \
    wheel==0.46.2