Files
ascend-tools/train/docker_ct_build.sh
T
2020-10-19 20:22:23 +08:00

24 lines
1.3 KiB
Bash

#!/bin/bash
#
# Creates a macvlan docker network on the interface found in the host routing
# table, starts the detached "mpirun" container attached to that network, and
# then runs "/etc/init.d/ssh start" inside the container.
#
# Settings are loaded by evaluating the output of get_params_for_yaml.sh, which
# is called with train/yaml/cluster_info.yaml and the key 'tensorflow_config'.
# The following variables are used but not assigned anywhere in this script, so
# they are expected to come from that output:
#   epcount, ip, docker_images           (required)
#   imagenet_data, yolo_data, ssd_data, bert_data   (dataset directories)
# NOTE(review): epcount is used as the suffix after "/" in --subnet, so it is
# presumably the network prefix length - confirm against cluster_info.yaml.

# Print an error message to stderr and abort the script.
die() {
  printf 'docker_ct_build: %s\n' "$*" >&2
  exit 1
}

currentDir=$(cd "$(dirname "$0")" && pwd) || die "cannot resolve the script directory"
# ${currentDir%train*} strips the shortest trailing "train*" match, i.e. it
# yields the path prefix in front of the last "train" component.
yamlpath=${currentDir%train*}train/yaml/cluster_info.yaml
toolsPath=${currentDir%train*}train/atlas_benchmark-master/utils/shell

# Load the configuration from the yaml file.
# NOTE(review): eval executes whatever the helper prints; cluster_info.yaml and
# the helper script must be trusted.
eval "$("${toolsPath}/get_params_for_yaml.sh" "${yamlpath}" 'tensorflow_config')"

# Fail early instead of handing docker malformed options such as "--ip=".
for required_name in epcount ip docker_images; do
  [[ -n "${!required_name:-}" ]] \
    || die "'${required_name}' is empty; check 'tensorflow_config' in ${yamlpath}"
done

# Docker network bridging.
# Read the routing table once so that all three values come from the same
# snapshot. Row 3 of `route -n` is the first route entry (rows 1-2 are
# headers); row 4 is the second entry.
route_table=$(route -n) || die "'route -n' failed"
net_subnet=$(awk 'NR == 4 { print $1 }' <<<"${route_table}")
net_gateway=$(awk 'NR == 3 { print $2 }' <<<"${route_table}")
net_parent=$(awk 'NR == 3 { print $8 }' <<<"${route_table}")
printf '%s\n' "${net_subnet}" "${net_gateway}" "${net_parent}"

[[ -n "${net_subnet}" && -n "${net_gateway}" && -n "${net_parent}" ]] \
  || die "could not read subnet/gateway/interface from 'route -n'"

# The network is named after its parent interface. Skip creation when it
# already exists so that the script can be re-run.
if ! docker network inspect "${net_parent}" >/dev/null 2>&1; then
  docker network create -d macvlan \
    --subnet="${net_subnet}/${epcount}" \
    --gateway="${net_gateway}" \
    -o parent="${net_parent}" \
    "${net_parent}" \
    || die "failed to create macvlan network '${net_parent}'"
fi

# Dataset directories are mounted at the same path inside the container.
# Unset entries are skipped because "-v :" is not a valid volume spec.
data_mounts=()
for dataset_name in imagenet_data yolo_data ssd_data bert_data; do
  dataset_dir=${!dataset_name:-}
  if [[ -n "${dataset_dir}" ]]; then
    data_mounts+=(-v "${dataset_dir}:${dataset_dir}")
  else
    printf 'docker_ct_build: %s is not set, skipping its mount\n' "${dataset_name}" >&2
  fi
done

# Docker container mounts.
train_mount="${currentDir%train*}/train"
docker run -ti -d \
  --net="${net_parent}" \
  --ip="${ip}" \
  --name mpirun \
  --shm-size=16g \
  -e ASCEND_VISIBLE_DEVICES=0-7 \
  -v "${train_mount}:${train_mount}" \
  "${data_mounts[@]}" \
  -v /var/log/npu/slog/:/var/log/npu/slog \
  -v /var/log/npu/profiling/:/var/log/npu/profiling \
  -v /var/log/npu/dump/:/var/log/npu/dump \
  -v /var/log/npu/:/usr/slog \
  "${docker_images}" /bin/bash

# `docker exec -t` refuses to run when stdin is not a terminal (cron, CI,
# non-interactive ssh), so only request a pseudo-TTY when one is available.
exec_flags=(-i)
if [[ -t 0 ]]; then
  exec_flags+=(-t)
fi
docker exec "${exec_flags[@]}" mpirun /bin/bash -c "/etc/init.d/ssh start"