account_id: &ACCOUNT_ID region: ®ION framework: &FRAMEWORK pytorch version: &VERSION 1.13.1 short_version: &SHORT_VERSION "1.13" arch_type: x86 repository_info: training_repository: &TRAINING_REPOSITORY image_type: &TRAINING_IMAGE_TYPE training root: !join [ *FRAMEWORK, "/", *TRAINING_IMAGE_TYPE ] repository_name: &REPOSITORY_NAME !join [pr, "-", *FRAMEWORK, "-", *TRAINING_IMAGE_TYPE] repository: &REPOSITORY !join [ *ACCOUNT_ID, .dkr.ecr., *REGION, .amazonaws.com/, *REPOSITORY_NAME ] context: training_context: &TRAINING_CONTEXT changehostname: source: docker/build_artifacts/changehostname.c target: changehostname.c start_with_right_hostname: source: docker/build_artifacts/start_with_right_hostname.sh target: start_with_right_hostname.sh example_mnist_file: source: docker/build_artifacts/mnist.py target: mnist.py deep_learning_container: source: ../../src/deep_learning_container.py target: deep_learning_container.py images: # BuildEC2CPUPTTrainPy3DockerImage: # <<: *TRAINING_REPOSITORY # build: &PYTORCH_CPU_TRAINING_PY3 false # image_size_baseline: 5000 # device_type: &DEVICE_TYPE cpu # python_version: &DOCKER_PYTHON_VERSION py3 # tag_python_version: &TAG_PYTHON_VERSION py39 # os_version: &OS_VERSION ubuntu20.04 # tag: !join [ *VERSION, "-", *DEVICE_TYPE, "-", *TAG_PYTHON_VERSION, "-", *OS_VERSION, "-ec2" ] # docker_file: !join [ docker/, *SHORT_VERSION, /, *DOCKER_PYTHON_VERSION, /Dockerfile., *DEVICE_TYPE ] # target: ec2 # context: # <<: *TRAINING_CONTEXT # BuildEC2GPUPTTrainPy3DockerImage: # <<: *TRAINING_REPOSITORY # build: &PYTORCH_GPU_TRAINING_PY3 false # image_size_baseline: 14000 # device_type: &DEVICE_TYPE gpu # python_version: &DOCKER_PYTHON_VERSION py3 # tag_python_version: &TAG_PYTHON_VERSION py39 # cuda_version: &CUDA_VERSION cu117 # os_version: &OS_VERSION ubuntu20.04 # tag: !join [ *VERSION, "-", *DEVICE_TYPE, "-", *TAG_PYTHON_VERSION, "-", *CUDA_VERSION, "-", *OS_VERSION, "-ec2" ] # docker_file: !join [ docker/, *SHORT_VERSION, /, *DOCKER_PYTHON_VERSION, /, *CUDA_VERSION, /Dockerfile., # *DEVICE_TYPE ] # target: ec2 # context: # <<: *TRAINING_CONTEXT BuildSageMakerCPUPTTrainPy3DockerImage: <<: *TRAINING_REPOSITORY build: &PYTORCH_CPU_TRAINING_PY3 false image_size_baseline: 6200 device_type: &DEVICE_TYPE cpu python_version: &DOCKER_PYTHON_VERSION py3 tag_python_version: &TAG_PYTHON_VERSION py39 os_version: &OS_VERSION ubuntu20.04 tag: !join [ *VERSION, "-", *DEVICE_TYPE, "-", *TAG_PYTHON_VERSION, "-", *OS_VERSION, "-sagemaker" ] docker_file: !join [ docker/, *SHORT_VERSION, /, *DOCKER_PYTHON_VERSION, /Dockerfile., *DEVICE_TYPE ] target: sagemaker context: <<: *TRAINING_CONTEXT BuildSageMakerGPUPTTrainPy3DockerImage: <<: *TRAINING_REPOSITORY build: &PYTORCH_GPU_TRAINING_PY3 false image_size_baseline: 14000 device_type: &DEVICE_TYPE gpu python_version: &DOCKER_PYTHON_VERSION py3 tag_python_version: &TAG_PYTHON_VERSION py39 cuda_version: &CUDA_VERSION cu117 os_version: &OS_VERSION ubuntu20.04 tag: !join [ *VERSION, "-", *DEVICE_TYPE, "-", *TAG_PYTHON_VERSION, "-", *CUDA_VERSION, "-", *OS_VERSION, "-sagemaker" ] docker_file: !join [ docker/, *SHORT_VERSION, /, *DOCKER_PYTHON_VERSION, /, *CUDA_VERSION, /Dockerfile., *DEVICE_TYPE ] target: sagemaker context: <<: *TRAINING_CONTEXT # BuildPyTorchExampleGPUTrainPy3DockerImage: # <<: *TRAINING_REPOSITORY # build: &PYTORCH_GPU_TRAINING_PY3 false # image_size_baseline: 14000 # base_image_name: BuildEC2GPUPTTrainPy3DockerImage # device_type: &DEVICE_TYPE gpu # python_version: &DOCKER_PYTHON_VERSION py3 # tag_python_version: &TAG_PYTHON_VERSION py39 # cuda_version: &CUDA_VERSION cu117 # os_version: &OS_VERSION ubuntu20.04 # tag: !join [ *VERSION, "-", *DEVICE_TYPE, "-", *TAG_PYTHON_VERSION, "-", *CUDA_VERSION, "-", *OS_VERSION, # "-ec2-example" ] # docker_file: !join [ docker/, *SHORT_VERSION, /, *DOCKER_PYTHON_VERSION, /example, /Dockerfile., *DEVICE_TYPE ] # context: # <<: *TRAINING_CONTEXT