mirror of
https://github.com/modelscope/modelscope.git
synced 2025-12-16 16:27:45 +01:00
* fix ci issue * fix case issue * modify lint to python3.10 * fix case issue --------- Co-authored-by: mulin.lyh <mulin.lyh@taobao.com>
233 lines
9.1 KiB
Bash
233 lines
9.1 KiB
Bash
#!/bin/bash
|
|
# default values.
|
|
#BASE_PY37_CPU_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu20.04-py37-torch1.11.0-tf1.15.5-base
|
|
#BASE_PY38_CPU_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu20.04-py38-torch1.11.0-tf1.15.5-base
|
|
#BASE_PY38_GPU_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu20.04-cuda11.3.0-py38-torch1.11.0-tf1.15.5-base
|
|
#BASE_PY38_GPU_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu20.04-cuda11.7.1-py38-torch2.0.1-tf1.15.5-base
|
|
#BASE_PY38_GPU_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu20.04-cuda11.7.1-py38-torch1.13.1-tf2.6.0-base
|
|
#BASE_PY37_GPU_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu20.04-cuda11.3.0-py37-torch1.11.0-tf1.15.5-base
|
|
MODELSCOPE_REPO_ADDRESS=reg.docker.alibaba-inc.com/modelscope/modelscope
|
|
python_version=3.7.13
|
|
torch_version=1.11.0
|
|
cudatoolkit_version=11.7
|
|
tensorflow_version=1.15.5
|
|
modelscope_version=None
|
|
cuda_version=11.7.1
|
|
is_ci_test=False
|
|
is_dsw=False
|
|
is_cpu=False
|
|
run_ci_test=False
|
|
function usage(){
|
|
echo "usage: build.sh "
|
|
echo " --python=python_version set python version, default: $python_version"
|
|
echo " --cuda=cuda_version set cuda version,only[11.3.0, 11.7.1], fefault: $cuda_version"
|
|
echo " --torch=torch_version set pytorch version, fefault: $torch_version"
|
|
echo " --tensorflow=tensorflow_version set tensorflow version, default: $tensorflow_version"
|
|
echo " --modelscope=modelscope_version set modelscope version, default: $modelscope_version"
|
|
echo " --test option for run test before push image, only push on ci test pass"
|
|
echo " --cpu option for build cpu version"
|
|
echo " --dsw option for build dsw version"
|
|
echo " --ci option for build ci version"
|
|
echo " --push option for push image to remote repo"
|
|
}
|
|
for i in "$@"; do
|
|
case $i in
|
|
--python=*)
|
|
python_version="${i#*=}"
|
|
shift
|
|
;;
|
|
--cuda=*)
|
|
cuda_version="${i#*=}"
|
|
if [ "$cuda_version" == "11.3.0" ]; then
|
|
cudatoolkit_version=11.3
|
|
elif [ "$cuda_version" == "11.7.1" ]; then
|
|
cudatoolkit_version=11.7
|
|
elif [ "$cuda_version" == "11.8.0" ]; then
|
|
cudatoolkit_version=11.8
|
|
elif [ "$cuda_version" == "12.1.0" ]; then
|
|
cudatoolkit_version=12.1
|
|
else
|
|
echo "Unsupport cuda version $cuda_version"
|
|
exit 1
|
|
fi
|
|
shift # pytorch version
|
|
;;
|
|
--torch=*)
|
|
torch_version="${i#*=}"
|
|
shift # pytorch version
|
|
;;
|
|
--tensorflow=*)
|
|
tensorflow_version="${i#*=}"
|
|
shift # tensorflow version
|
|
;;
|
|
--cudatoolkit=*)
|
|
cudatoolkit_version="${i#*=}"
|
|
shift # cudatoolkit for pytorch
|
|
;;
|
|
--modelscope=*)
|
|
modelscope_version="${i#*=}"
|
|
shift # modelscope version
|
|
;;
|
|
--test)
|
|
run_ci_test=True
|
|
shift # will run ci test
|
|
;;
|
|
--cpu)
|
|
is_cpu=True
|
|
shift # is cpu image
|
|
;;
|
|
--ci)
|
|
is_ci_test=True
|
|
shift # is ci, will not install modelscope
|
|
;;
|
|
--dsw)
|
|
is_dsw=True
|
|
shift # is dsw, will set dsw cache location
|
|
;;
|
|
--push)
|
|
is_push=True
|
|
shift # option for push image to remote repo
|
|
;;
|
|
--help)
|
|
usage
|
|
exit 0
|
|
;;
|
|
-*|--*)
|
|
echo "Unknown option $i"
|
|
usage
|
|
exit 1
|
|
;;
|
|
*)
|
|
;;
|
|
esac
|
|
done
|
|
|
|
if [ "$modelscope_version" == "None" ]; then
|
|
echo "ModelScope version must specify!"
|
|
exit 1
|
|
fi
|
|
if [ "$is_cpu" == "True" ]; then
|
|
base_tag=ubuntu20.04
|
|
export USE_GPU=False
|
|
else
|
|
base_tag=ubuntu20.04-cuda$cuda_version
|
|
export USE_GPU=True
|
|
fi
|
|
|
|
if [[ $python_version == 3.7* ]]; then
|
|
if [ "$is_cpu" == "True" ]; then
|
|
echo "Building python3.7 cpu image"
|
|
export BASE_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu20.04-py37-torch$torch_version-tf$tensorflow_version-base
|
|
else
|
|
echo "Building python3.7 gpu image"
|
|
export BASE_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu20.04-cuda$cuda_version-py37-torch$torch_version-tf$tensorflow_version-base
|
|
fi
|
|
base_tag=$base_tag-py37
|
|
elif [[ $python_version == 3.8* ]]; then
|
|
if [ "$is_cpu" == "True" ]; then
|
|
echo "Building python3.8 cpu image"
|
|
export BASE_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu20.04-py38-torch$torch_version-tf$tensorflow_version-base
|
|
else
|
|
echo "Building python3.8 gpu image"
|
|
export BASE_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu20.04-cuda$cuda_version-py38-torch$torch_version-tf$tensorflow_version-base
|
|
fi
|
|
base_tag=$base_tag-py38
|
|
elif [[ $python_version == 3.10* ]]; then
|
|
if [ "$is_cpu" == "True" ]; then
|
|
echo "Building python3.10 cpu image"
|
|
base_tag=ubuntu22.04-py310
|
|
export BASE_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu22.04-py310-torch$torch_version-tf$tensorflow_version-base
|
|
else
|
|
echo "Building python3.10 gpu image"
|
|
base_tag=ubuntu22.04-cuda$cuda_version-py310
|
|
# reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu22.04-cuda12.1.0-py310-torch2.1.0-tf2.14.0-base
|
|
export BASE_IMAGE=reg.docker.alibaba-inc.com/modelscope/modelscope:ubuntu22.04-cuda$cuda_version-py310-torch$torch_version-tf$tensorflow_version-base
|
|
fi
|
|
else
|
|
echo "Unsupport python version: $python_version"
|
|
exit 1
|
|
fi
|
|
|
|
target_image_tag=$base_tag-torch$torch_version-tf$tensorflow_version
|
|
if [ "$is_ci_test" == "True" ]; then
|
|
target_image_tag=$target_image_tag-$modelscope_version-ci
|
|
else
|
|
target_image_tag=$target_image_tag-$modelscope_version-test
|
|
fi
|
|
export IMAGE_TO_BUILD=$MODELSCOPE_REPO_ADDRESS:$target_image_tag
|
|
export PYTHON_VERSION=$python_version
|
|
export TORCH_VERSION=$torch_version
|
|
export CUDATOOLKIT_VERSION=$cudatoolkit_version
|
|
export TENSORFLOW_VERSION=$tensorflow_version
|
|
echo -e "Building image with:\npython$python_version\npytorch$torch_version\ntensorflow:$tensorflow_version\ncudatoolkit:$cudatoolkit_version\ncpu:$is_cpu\nis_ci:$is_ci_test\nis_dsw:$is_dsw\n"
|
|
echo -e "Base iamge: $BASE_IMAGE"
|
|
docker_file_content=`cat docker/Dockerfile.ubuntu`
|
|
if [ "$is_ci_test" != "True" ]; then
|
|
echo "Building ModelScope lib, will install ModelScope lib to image"
|
|
docker_file_content="${docker_file_content} \nRUN export COMMIT_ID=$CIS_ENV_COMMIT_ID && pip install --no-cache-dir -U adaseq pai-easycv ms_swift funasr 'transformers==4.36.2'"
|
|
docker_file_content="${docker_file_content} \nRUN pip uninstall modelscope -y && export COMMIT_ID=$CIS_ENV_COMMIT_ID && cd /tmp && GIT_LFS_SKIP_SMUDGE=1 git clone -b $CIS_ENV_BRANCH --single-branch $REPO_URL && cd MaaS-lib && pip install . && cd / && rm -fr /tmp/MaaS-lib"
|
|
MMCV_WITH_OPS=1 MAX_JOBS=32 pip install --no-cache-dir 'mmcv-full<=1.7.0' && pip cache purge; \
|
|
fi
|
|
echo "$is_dsw"
|
|
if [ "$is_dsw" == "False" ]; then
|
|
echo "Not DSW image"
|
|
else
|
|
echo "Building dsw image will need set ModelScope lib cache location."
|
|
docker_file_content="${docker_file_content} \nENV MODELSCOPE_CACHE=/mnt/workspace/.cache/modelscope"
|
|
# pre compile extension
|
|
docker_file_content="${docker_file_content} \nRUN pip uninstall -y tb-nightly && pip install --no-cache-dir -U tensorboard && TORCH_CUDA_ARCH_LIST='6.0 6.1 7.0 7.5 8.0 8.9 9.0 8.6+PTX' python -c 'from modelscope.utils.pre_compile import pre_compile_all;pre_compile_all()'"
|
|
fi
|
|
if [ "$is_ci_test" == "True" ]; then
|
|
echo "Building CI image, uninstall modelscope"
|
|
docker_file_content="${docker_file_content} \nRUN pip uninstall modelscope -y"
|
|
fi
|
|
docker_file_content="${docker_file_content} \n RUN cp /tmp/resources/conda.aliyun ~/.condarc && \
|
|
pip config set global.index-url https://mirrors.aliyun.com/pypi/simple && \
|
|
pip config set install.trusted-host mirrors.aliyun.com && \
|
|
cp /tmp/resources/ubuntu2204.aliyun /etc/apt/sources.list "
|
|
|
|
printf "$docker_file_content" > Dockerfile
|
|
|
|
while true
|
|
do
|
|
docker build --progress=plain -t $IMAGE_TO_BUILD \
|
|
--build-arg USE_GPU \
|
|
--build-arg BASE_IMAGE \
|
|
--build-arg PYTHON_VERSION \
|
|
--build-arg TORCH_VERSION \
|
|
--build-arg CUDATOOLKIT_VERSION \
|
|
--build-arg TENSORFLOW_VERSION \
|
|
-f Dockerfile .
|
|
if [ $? -eq 0 ]; then
|
|
echo "Image build done"
|
|
break
|
|
else
|
|
echo "Running docker build command error, we will retry"
|
|
fi
|
|
done
|
|
|
|
if [ "$run_ci_test" == "True" ]; then
|
|
echo "Running ci case."
|
|
export MODELSCOPE_CACHE=/home/mulin.lyh/model_scope_cache
|
|
export MODELSCOPE_HOME_CACHE=/home/mulin.lyh/ci_case_home # for credential
|
|
export IMAGE_NAME=$MODELSCOPE_REPO_ADDRESS
|
|
export IMAGE_VERSION=$target_image_tag
|
|
export MODELSCOPE_DOMAIN=www.modelscope.cn
|
|
export HUB_DATASET_ENDPOINT=http://www.modelscope.cn
|
|
export CI_TEST=True
|
|
export TEST_LEVEL=1
|
|
if [ "$is_ci_test" != "True" ]; then
|
|
echo "Testing for dsw image or MaaS-lib image"
|
|
export CI_COMMAND="python tests/run.py"
|
|
fi
|
|
bash .dev_scripts/dockerci.sh
|
|
if [ $? -ne 0 ]; then
|
|
echo "Running unittest failed, please check the log!"
|
|
exit -1
|
|
fi
|
|
fi
|
|
if [ "$is_push" == "True" ]; then
|
|
echo "Pushing image: $IMAGE_TO_BUILD"
|
|
docker push $IMAGE_TO_BUILD
|
|
fi
|