summary refs log tree commit diff
path: root/share/spack
diff options
context:
space:
mode:
author Adam J. Stewart <ajstewart426@gmail.com> 2022-12-22 11:31:40 -0600
committer GitHub <noreply@github.com> 2022-12-22 11:31:40 -0600
commit eb67497020f64de7a10f683eda0177a637b4ccf0 (patch)
tree e2961e5889ecc01315f75c9f917d36a9b82227c0 /share/spack
parent 371268a9aae0bc5cc3c055088130baf5d2cef340 (diff)
download spack-eb67497020f64de7a10f683eda0177a637b4ccf0.tar.gz
spack-eb67497020f64de7a10f683eda0177a637b4ccf0.tar.bz2
spack-eb67497020f64de7a10f683eda0177a637b4ccf0.tar.xz
spack-eb67497020f64de7a10f683eda0177a637b4ccf0.zip
ML CI: Linux x86_64 (#34299)
* ML CI: Linux x86_64 * Update comments * Rename again * Rename comments * Update to match other arches * No compiler * Compiler was wrong anyway * Faster TF
Diffstat (limited to 'share/spack')
-rw-r--r-- share/spack/gitlab/cloud_pipelines/.gitlab-ci.yml 106
-rw-r--r-- share/spack/gitlab/cloud_pipelines/stacks/ml-linux-x86_64-cpu/spack.yaml (renamed from share/spack/gitlab/cloud_pipelines/stacks/ml-cpu/spack.yaml) 143
-rw-r--r-- share/spack/gitlab/cloud_pipelines/stacks/ml-linux-x86_64-cuda/spack.yaml (renamed from share/spack/gitlab/cloud_pipelines/stacks/ml-cuda/spack.yaml) 143
-rw-r--r-- share/spack/gitlab/cloud_pipelines/stacks/ml-linux-x86_64-rocm/spack.yaml (renamed from share/spack/gitlab/cloud_pipelines/stacks/ml-rocm/spack.yaml) 147
4 files changed, 283 insertions, 256 deletions
diff --git a/share/spack/gitlab/cloud_pipelines/.gitlab-ci.yml b/share/spack/gitlab/cloud_pipelines/.gitlab-ci.yml
index 8122cd7f35..8800387436 100644
--- a/share/spack/gitlab/cloud_pipelines/.gitlab-ci.yml
+++ b/share/spack/gitlab/cloud_pipelines/.gitlab-ci.yml
@@ -760,122 +760,122 @@ tutorial-protected-build:
- artifacts: True
job: tutorial-protected-generate
-########################################
-# Machine Learning (CPU)
-########################################
-.ml-cpu:
+#######################################
+# Machine Learning - Linux x86_64 (CPU)
+#######################################
+.ml-linux-x86_64-cpu:
variables:
- SPACK_CI_STACK_NAME: ml-cpu
+ SPACK_CI_STACK_NAME: ml-linux-x86_64-cpu
-.ml-cpu-generate:
- extends: .ml-cpu
+.ml-linux-x86_64-cpu-generate:
+ extends: .ml-linux-x86_64-cpu
image: ghcr.io/spack/e4s-amazonlinux-2:v2022-03-21
tags: ["spack", "aws", "public", "medium", "x86_64_v4"]
-ml-cpu-pr-generate:
- extends: [ ".ml-cpu-generate", ".pr-generate"]
+ml-linux-x86_64-cpu-pr-generate:
+ extends: [ ".ml-linux-x86_64-cpu-generate", ".pr-generate"]
-ml-cpu-protected-generate:
- extends: [ ".ml-cpu-generate", ".protected-generate"]
+ml-linux-x86_64-cpu-protected-generate:
+ extends: [ ".ml-linux-x86_64-cpu-generate", ".protected-generate"]
-ml-cpu-pr-build:
- extends: [ ".ml-cpu", ".pr-build" ]
+ml-linux-x86_64-cpu-pr-build:
+ extends: [ ".ml-linux-x86_64-cpu", ".pr-build" ]
trigger:
include:
- artifact: jobs_scratch_dir/cloud-ci-pipeline.yml
- job: ml-cpu-pr-generate
+ job: ml-linux-x86_64-cpu-pr-generate
strategy: depend
needs:
- artifacts: True
- job: ml-cpu-pr-generate
+ job: ml-linux-x86_64-cpu-pr-generate
-ml-cpu-protected-build:
- extends: [ ".ml-cpu", ".protected-build" ]
+ml-linux-x86_64-cpu-protected-build:
+ extends: [ ".ml-linux-x86_64-cpu", ".protected-build" ]
trigger:
include:
- artifact: jobs_scratch_dir/cloud-ci-pipeline.yml
- job: ml-cpu-protected-generate
+ job: ml-linux-x86_64-cpu-protected-generate
strategy: depend
needs:
- artifacts: True
- job: ml-cpu-protected-generate
+ job: ml-linux-x86_64-cpu-protected-generate
########################################
-# Machine Learning (CUDA)
+# Machine Learning - Linux x86_64 (CUDA)
########################################
-.ml-cuda:
+.ml-linux-x86_64-cuda:
variables:
- SPACK_CI_STACK_NAME: ml-cuda
+ SPACK_CI_STACK_NAME: ml-linux-x86_64-cuda
-.ml-cuda-generate:
- extends: .ml-cuda
+.ml-linux-x86_64-cuda-generate:
+ extends: .ml-linux-x86_64-cuda
image: ghcr.io/spack/e4s-amazonlinux-2:v2022-03-21
tags: ["spack", "aws", "public", "medium", "x86_64_v4"]
-ml-cuda-pr-generate:
- extends: [ ".ml-cuda-generate", ".pr-generate"]
+ml-linux-x86_64-cuda-pr-generate:
+ extends: [ ".ml-linux-x86_64-cuda-generate", ".pr-generate"]
-ml-cuda-protected-generate:
- extends: [ ".ml-cuda-generate", ".protected-generate"]
+ml-linux-x86_64-cuda-protected-generate:
+ extends: [ ".ml-linux-x86_64-cuda-generate", ".protected-generate"]
-ml-cuda-pr-build:
- extends: [ ".ml-cuda", ".pr-build" ]
+ml-linux-x86_64-cuda-pr-build:
+ extends: [ ".ml-linux-x86_64-cuda", ".pr-build" ]
trigger:
include:
- artifact: jobs_scratch_dir/cloud-ci-pipeline.yml
- job: ml-cuda-pr-generate
+ job: ml-linux-x86_64-cuda-pr-generate
strategy: depend
needs:
- artifacts: True
- job: ml-cuda-pr-generate
+ job: ml-linux-x86_64-cuda-pr-generate
-ml-cuda-protected-build:
- extends: [ ".ml-cuda", ".protected-build" ]
+ml-linux-x86_64-cuda-protected-build:
+ extends: [ ".ml-linux-x86_64-cuda", ".protected-build" ]
trigger:
include:
- artifact: jobs_scratch_dir/cloud-ci-pipeline.yml
- job: ml-cuda-protected-generate
+ job: ml-linux-x86_64-cuda-protected-generate
strategy: depend
needs:
- artifacts: True
- job: ml-cuda-protected-generate
+ job: ml-linux-x86_64-cuda-protected-generate
########################################
-# Machine Learning (ROCm)
+# Machine Learning - Linux x86_64 (ROCm)
########################################
-.ml-rocm:
+.ml-linux-x86_64-rocm:
variables:
- SPACK_CI_STACK_NAME: ml-rocm
+ SPACK_CI_STACK_NAME: ml-linux-x86_64-rocm
-.ml-rocm-generate:
- extends: .ml-rocm
+.ml-linux-x86_64-rocm-generate:
+ extends: .ml-linux-x86_64-rocm
image: ghcr.io/spack/e4s-amazonlinux-2:v2022-03-21
tags: ["spack", "aws", "public", "medium", "x86_64_v4"]
-ml-rocm-pr-generate:
- extends: [ ".ml-rocm-generate", ".pr-generate"]
+ml-linux-x86_64-rocm-pr-generate:
+ extends: [ ".ml-linux-x86_64-rocm-generate", ".pr-generate"]
-ml-rocm-protected-generate:
- extends: [ ".ml-rocm-generate", ".protected-generate"]
+ml-linux-x86_64-rocm-protected-generate:
+ extends: [ ".ml-linux-x86_64-rocm-generate", ".protected-generate"]
-ml-rocm-pr-build:
- extends: [ ".ml-rocm", ".pr-build" ]
+ml-linux-x86_64-rocm-pr-build:
+ extends: [ ".ml-linux-x86_64-rocm", ".pr-build" ]
trigger:
include:
- artifact: jobs_scratch_dir/cloud-ci-pipeline.yml
- job: ml-rocm-pr-generate
+ job: ml-linux-x86_64-rocm-pr-generate
strategy: depend
needs:
- artifacts: True
- job: ml-rocm-pr-generate
+ job: ml-linux-x86_64-rocm-pr-generate
-ml-rocm-protected-build:
- extends: [ ".ml-rocm", ".protected-build" ]
+ml-linux-x86_64-rocm-protected-build:
+ extends: [ ".ml-linux-x86_64-rocm", ".protected-build" ]
trigger:
include:
- artifact: jobs_scratch_dir/cloud-ci-pipeline.yml
- job: ml-rocm-protected-generate
+ job: ml-linux-x86_64-rocm-protected-generate
strategy: depend
needs:
- artifacts: True
- job: ml-rocm-protected-generate
+ job: ml-linux-x86_64-rocm-protected-generate
diff --git a/share/spack/gitlab/cloud_pipelines/stacks/ml-cpu/spack.yaml b/share/spack/gitlab/cloud_pipelines/stacks/ml-linux-x86_64-cpu/spack.yaml
index ec2ac30b8a..bfd5020cea 100644
--- a/share/spack/gitlab/cloud_pipelines/stacks/ml-cpu/spack.yaml
+++ b/share/spack/gitlab/cloud_pipelines/stacks/ml-linux-x86_64-cpu/spack.yaml
@@ -16,77 +16,85 @@ spack:
packages:
all:
- compiler: [gcc@11.2.0]
target: [x86_64_v3]
variants: ~cuda~rocm
+ definitions:
+ - packages:
+ # Horovod
+ - py-horovod
+
+ # Hugging Face
+ - py-transformers
+
+ # JAX
+ - py-jax
+ - py-jaxlib
+
+ # Keras
+ - py-keras
+ - py-keras-applications
+ - py-keras-preprocessing
+ - py-keras2onnx
+
+ # PyTorch
+ - py-botorch
+ - py-efficientnet-pytorch
+ - py-gpytorch
+ - py-kornia
+ - py-pytorch-gradual-warmup-lr
+ - py-pytorch-lightning
+ - py-segmentation-models-pytorch
+ - py-timm
+ - py-torch
+ - py-torch-cluster
+ - py-torch-geometric
+ - py-torch-nvidia-apex
+ - py-torch-scatter
+ - py-torch-sparse
+ - py-torch-spline-conv
+ - py-torchaudio
+ - py-torchdata
+ - py-torchfile
+ - py-torchgeo
+ - py-torchmeta
+ - py-torchmetrics
+ - py-torchtext
+ - py-torchvision
+ - py-vector-quantize-pytorch
+
+ # scikit-learn
+ - py-scikit-learn
+ - py-scikit-learn-extra
+
+ # TensorBoard
+ - py-tensorboard
+ - py-tensorboard-data-server
+ - py-tensorboard-plugin-wit
+ - py-tensorboardx
+
+ # TensorFlow
+ - py-tensorflow
+ - py-tensorflow-datasets
+ - py-tensorflow-estimator
+ - py-tensorflow-hub
+ - py-tensorflow-metadata
+ - py-tensorflow-probability
+
+ # XGBoost
+ - py-xgboost
+ # - r-xgboost
+ - xgboost
+
+ - arch:
+ - target=x86_64_v3
+
specs:
- # Horovod
- - py-horovod
-
- # Hugging Face
- - py-transformers
-
- # JAX
- - py-jax
- - py-jaxlib
-
- # Keras
- - py-keras
- - py-keras-applications
- - py-keras-preprocessing
- - py-keras2onnx
-
- # PyTorch
- - py-botorch
- - py-efficientnet-pytorch
- - py-gpytorch
- - py-kornia
- - py-pytorch-gradual-warmup-lr
- - py-pytorch-lightning
- - py-segmentation-models-pytorch
- - py-timm
- - py-torch
- - py-torch-cluster
- - py-torch-geometric
- - py-torch-nvidia-apex
- - py-torch-scatter
- - py-torch-sparse
- - py-torch-spline-conv
- - py-torchaudio
- - py-torchdata
- - py-torchfile
- - py-torchgeo
- - py-torchmeta
- - py-torchmetrics
- - py-torchtext
- - py-torchvision
- - py-vector-quantize-pytorch
-
- # scikit-learn
- - py-scikit-learn
- - py-scikit-learn-extra
-
- # TensorBoard
- - py-tensorboard
- - py-tensorboard-data-server
- - py-tensorboard-plugin-wit
- - py-tensorboardx
-
- # TensorFlow
- - py-tensorflow
- - py-tensorflow-datasets
- - py-tensorflow-estimator
- - py-tensorflow-hub
- - py-tensorflow-metadata
- - py-tensorflow-probability
-
- # XGBoost
- - py-xgboost
- # - r-xgboost
- - xgboost
-
- mirrors: { "mirror": "s3://spack-binaries/develop/ml-cpu" }
+ - matrix:
+ - [$packages]
+ - [$arch]
+
+ mirrors: { "mirror": "s3://spack-binaries/develop/ml-linux-x86_64-cpu" }
gitlab-ci:
script:
@@ -113,6 +121,7 @@ spack:
mappings:
- match:
- llvm
+ - py-tensorflow
- py-torch
runner-attributes:
tags: [ "spack", "huge", "x86_64_v4" ]
diff --git a/share/spack/gitlab/cloud_pipelines/stacks/ml-cuda/spack.yaml b/share/spack/gitlab/cloud_pipelines/stacks/ml-linux-x86_64-cuda/spack.yaml
index d0c9823c40..4ab8e3698b 100644
--- a/share/spack/gitlab/cloud_pipelines/stacks/ml-cuda/spack.yaml
+++ b/share/spack/gitlab/cloud_pipelines/stacks/ml-linux-x86_64-cuda/spack.yaml
@@ -16,80 +16,88 @@ spack:
packages:
all:
- compiler: [gcc@11.2.0]
target: [x86_64_v3]
variants: ~rocm+cuda cuda_arch=80
llvm:
# https://github.com/spack/spack/issues/27999
require: ~cuda
+ definitions:
+ - packages:
+ # Horovod
+ - py-horovod
+
+ # Hugging Face
+ - py-transformers
+
+ # JAX
+ - py-jax
+ - py-jaxlib
+
+ # Keras
+ - py-keras
+ - py-keras-applications
+ - py-keras-preprocessing
+ - py-keras2onnx
+
+ # PyTorch
+ - py-botorch
+ - py-efficientnet-pytorch
+ - py-gpytorch
+ - py-kornia
+ - py-pytorch-gradual-warmup-lr
+ - py-pytorch-lightning
+ - py-segmentation-models-pytorch
+ - py-timm
+ - py-torch
+ - py-torch-cluster
+ - py-torch-geometric
+ - py-torch-nvidia-apex
+ - py-torch-scatter
+ - py-torch-sparse
+ - py-torch-spline-conv
+ - py-torchaudio
+ - py-torchdata
+ - py-torchfile
+ - py-torchgeo
+ - py-torchmeta
+ - py-torchmetrics
+ - py-torchtext
+ - py-torchvision
+ - py-vector-quantize-pytorch
+
+ # scikit-learn
+ - py-scikit-learn
+ - py-scikit-learn-extra
+
+ # TensorBoard
+ - py-tensorboard
+ - py-tensorboard-data-server
+ - py-tensorboard-plugin-wit
+ - py-tensorboardx
+
+ # TensorFlow
+ - py-tensorflow
+ - py-tensorflow-datasets
+ - py-tensorflow-estimator
+ - py-tensorflow-hub
+ - py-tensorflow-metadata
+ - py-tensorflow-probability
+
+ # XGBoost
+ - py-xgboost
+ # - r-xgboost
+ - xgboost
+
+ - arch:
+ - target=x86_64_v3
+
specs:
- # Horovod
- - py-horovod
-
- # Hugging Face
- - py-transformers
-
- # JAX
- - py-jax
- - py-jaxlib
-
- # Keras
- - py-keras
- - py-keras-applications
- - py-keras-preprocessing
- - py-keras2onnx
-
- # PyTorch
- - py-botorch
- - py-efficientnet-pytorch
- - py-gpytorch
- - py-kornia
- - py-pytorch-gradual-warmup-lr
- - py-pytorch-lightning
- - py-segmentation-models-pytorch
- - py-timm
- - py-torch
- - py-torch-cluster
- - py-torch-geometric
- - py-torch-nvidia-apex
- - py-torch-scatter
- - py-torch-sparse
- - py-torch-spline-conv
- - py-torchaudio
- - py-torchdata
- - py-torchfile
- - py-torchgeo
- - py-torchmeta
- - py-torchmetrics
- - py-torchtext
- - py-torchvision
- - py-vector-quantize-pytorch
-
- # scikit-learn
- - py-scikit-learn
- - py-scikit-learn-extra
-
- # TensorBoard
- - py-tensorboard
- - py-tensorboard-data-server
- - py-tensorboard-plugin-wit
- - py-tensorboardx
-
- # TensorFlow
- - py-tensorflow
- - py-tensorflow-datasets
- - py-tensorflow-estimator
- - py-tensorflow-hub
- - py-tensorflow-metadata
- - py-tensorflow-probability
-
- # XGBoost
- - py-xgboost
- # - r-xgboost
- - xgboost
-
- mirrors: { "mirror": "s3://spack-binaries/develop/ml-cuda" }
+ - matrix:
+ - [$packages]
+ - [$arch]
+
+ mirrors: { "mirror": "s3://spack-binaries/develop/ml-linux-x86_64-cuda" }
gitlab-ci:
script:
@@ -116,6 +124,7 @@ spack:
mappings:
- match:
- llvm
+ - py-tensorflow
- py-torch
runner-attributes:
tags: [ "spack", "huge", "x86_64_v4" ]
diff --git a/share/spack/gitlab/cloud_pipelines/stacks/ml-rocm/spack.yaml b/share/spack/gitlab/cloud_pipelines/stacks/ml-linux-x86_64-rocm/spack.yaml
index 601327ec7e..29cf0aabe0 100644
--- a/share/spack/gitlab/cloud_pipelines/stacks/ml-rocm/spack.yaml
+++ b/share/spack/gitlab/cloud_pipelines/stacks/ml-linux-x86_64-rocm/spack.yaml
@@ -16,7 +16,6 @@ spack:
packages:
all:
- compiler: [gcc@11.2.0]
target: [x86_64_v3]
variants: ~cuda+rocm amdgpu_target=gfx90a
gl:
@@ -25,74 +24,83 @@ spack:
# Does not yet support Spack-installed ROCm
require: ~rocm
+ definitions:
+ - packages:
+ # Horovod
+ - py-horovod
+
+ # Hugging Face
+ - py-transformers
+
+ # JAX
+ - py-jax
+ - py-jaxlib
+
+ # Keras
+ - py-keras
+ - py-keras-applications
+ - py-keras-preprocessing
+ - py-keras2onnx
+
+ # PyTorch
+ # Does not yet support Spack-installed ROCm
+ # - py-botorch
+ # - py-efficientnet-pytorch
+ # - py-gpytorch
+ # - py-kornia
+ # - py-pytorch-gradual-warmup-lr
+ # - py-pytorch-lightning
+ # - py-segmentation-models-pytorch
+ # - py-timm
+ # - py-torch
+ # - py-torch-cluster
+ # - py-torch-geometric
+ # - py-torch-nvidia-apex
+ # - py-torch-scatter
+ # - py-torch-sparse
+ # - py-torch-spline-conv
+ # - py-torchaudio
+ # - py-torchdata
+ # - py-torchfile
+ # - py-torchgeo
+ # - py-torchmeta
+ # - py-torchmetrics
+ # - py-torchtext
+ # - py-torchvision
+ # - py-vector-quantize-pytorch
+
+ # scikit-learn
+ - py-scikit-learn
+ - py-scikit-learn-extra
+
+ # TensorBoard
+ - py-tensorboard
+ - py-tensorboard-data-server
+ - py-tensorboard-plugin-wit
+ - py-tensorboardx
+
+ # TensorFlow
+ - py-tensorflow
+ - py-tensorflow-datasets
+ - py-tensorflow-estimator
+ - py-tensorflow-hub
+ - py-tensorflow-metadata
+ - py-tensorflow-probability
+
+ # XGBoost
+ - py-xgboost
+ # - r-xgboost
+ - xgboost
+
+ - arch:
+ - target=x86_64_v3
+
specs:
- # Horovod
- - py-horovod
-
- # Hugging Face
- - py-transformers
-
- # JAX
- - py-jax
- - py-jaxlib
-
- # Keras
- - py-keras
- - py-keras-applications
- - py-keras-preprocessing
- - py-keras2onnx
-
- # PyTorch
- # Does not yet support Spack-install ROCm
- # - py-botorch
- # - py-efficientnet-pytorch
- # - py-gpytorch
- # - py-kornia
- # - py-pytorch-gradual-warmup-lr
- # - py-pytorch-lightning
- # - py-segmentation-models-pytorch
- # - py-timm
- # - py-torch
- # - py-torch-cluster
- # - py-torch-geometric
- # - py-torch-nvidia-apex
- # - py-torch-scatter
- # - py-torch-sparse
- # - py-torch-spline-conv
- # - py-torchaudio
- # - py-torchdata
- # - py-torchfile
- # - py-torchgeo
- # - py-torchmeta
- # - py-torchmetrics
- # - py-torchtext
- # - py-torchvision
- # - py-vector-quantize-pytorch
-
- # scikit-learn
- - py-scikit-learn
- - py-scikit-learn-extra
-
- # TensorBoard
- - py-tensorboard
- - py-tensorboard-data-server
- - py-tensorboard-plugin-wit
- - py-tensorboardx
-
- # TensorFlow
- - py-tensorflow
- - py-tensorflow-datasets
- - py-tensorflow-estimator
- - py-tensorflow-hub
- - py-tensorflow-metadata
- - py-tensorflow-probability
-
- # XGBoost
- - py-xgboost
- # - r-xgboost
- - xgboost
-
- mirrors: { "mirror": "s3://spack-binaries/develop/ml-rocm" }
+ - matrix:
+ - [$packages]
+ - [$arch]
+
+ mirrors: { "mirror": "s3://spack-binaries/develop/ml-linux-x86_64-rocm" }
gitlab-ci:
script:
@@ -118,8 +126,9 @@ spack:
match_behavior: first
mappings:
- match:
- - llvm-amdgpu
- llvm
+ - llvm-amdgpu
+ - py-tensorflow
- py-torch
- rocblas
runner-attributes: