-
Notifications
You must be signed in to change notification settings - Fork 27
/
Copy path.gitlab-ci.yml
151 lines (146 loc) · 6.41 KB
/
.gitlab-ci.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
# Pipeline-wide variables: root of the out-of-source build tree and of the
# install prefix. Each job appends its own subdirectory to these paths.
variables:
  H5BENCH_BUILD_PATH: "${CI_PROJECT_DIR}/build"
  H5BENCH_INSTALL_PATH: "${CI_PROJECT_DIR}/install"
# Stages, in the order they are listed: build, test, metrics.
stages:
  - build
  - test
  - metrics
# Builds and installs h5bench (all benchmarks, -DH5BENCH_ALL=ON) for the
# regular test pipeline. Only created when METRICS is not set.
build-perlmutter:
  stage: build
  # Must be started by hand; allow_failure: false keeps it a blocking job.
  when: manual
  allow_failure: false
  id_tokens:
    SITE_ID_TOKEN:
      aud: https://software.nersc.gov/
  rules:
    - if: '$METRICS == null'
  tags:
    - perlmutter
  variables:
    GIT_SUBMODULE_STRATEGY: recursive
    # NOTE(review): looks like batch-scheduler (Slurm-style) flags consumed by
    # the runner: 1 node, 30-minute limit -- confirm against the runner setup.
    SCHEDULER_PARAMETERS: " -A m2621 --qos=debug --constraint=cpu --tasks-per-node=64 -N 1 -t 00:30:00"
    HDF5_DIR: "/global/cfs/cdirs/m2621/h5bench-perlmutter/hdf5/install"
    HDF5_HOME: "/global/cfs/cdirs/m2621/h5bench-perlmutter/hdf5/install"
  script:
    - echo "Build h5bench"
    - module list
    - module load cmake
    # Out-of-source build: the directory sits two levels below the project
    # root, hence the `../..` passed to cmake.
    - mkdir -p ${H5BENCH_BUILD_PATH}/perlmutter
    - cd ${H5BENCH_BUILD_PATH}/perlmutter
    - cmake ../.. -DCMAKE_INSTALL_PREFIX=${H5BENCH_INSTALL_PATH}/perlmutter -DH5BENCH_ALL=ON
    - make -j 8
    - make install
  # Build and install trees are kept as artifacts for test-perlmutter.
  artifacts:
    paths:
      - ${H5BENCH_BUILD_PATH}/perlmutter
      - ${H5BENCH_INSTALL_PATH}/perlmutter
# Runs the synchronous h5bench sample configurations from the build tree
# produced by build-perlmutter. Only created when METRICS is not set.
test-perlmutter:
  stage: test
  id_tokens:
    SITE_ID_TOKEN:
      aud: https://software.nersc.gov/
  rules:
    - if: '$METRICS == null'
  needs: ["build-perlmutter"]
  tags:
    - perlmutter
  variables:
    # NOTE(review): looks like batch-scheduler (Slurm-style) flags consumed by
    # the runner: 1 node, 30-minute limit -- confirm against the runner setup.
    SCHEDULER_PARAMETERS: " -A m2621 --qos=debug --constraint=cpu --tasks-per-node=64 -N 1 -t 00:30:00"
    HDF5_DIR: "/global/cfs/cdirs/m2621/h5bench-perlmutter/hdf5/install"
    HDF5_HOME: "/global/cfs/cdirs/m2621/h5bench-perlmutter/hdf5/install"
    MPICH_MAX_THREAD_SAFETY: "multiple"
  script:
    - echo "Test h5bench SYNC"
    - cd ${H5BENCH_BUILD_PATH}/perlmutter
    # Make the HDF5 and the installed h5bench libraries resolvable at runtime.
    - export LD_LIBRARY_PATH=$HDF5_DIR/lib:$H5BENCH_INSTALL_PATH/perlmutter/lib:$LD_LIBRARY_PATH
    # Every test below follows the same two steps: run update-perlmutter.py on
    # the sample JSON (presumably adapting it to Perlmutter -- verify in
    # samples/update-perlmutter.py), then run h5bench on that JSON.
    # Only the first test passes --validate-mode.
    - echo "Test h5bench SYNC write/read"
    - python3 ../../samples/update-perlmutter.py ../../samples/sync-write-read-contig-1d-small.json
    - ./h5bench --debug --abort-on-failure --validate-mode ../../samples/sync-write-read-contig-1d-small.json
    - echo "Test h5bench SYNC write unlimited"
    - python3 ../../samples/update-perlmutter.py ../../samples/sync-write-unlimited.json
    - ./h5bench --debug --abort-on-failure ../../samples/sync-write-unlimited.json
    - echo "Test h5bench SYNC overwrite"
    - python3 ../../samples/update-perlmutter.py ../../samples/sync-overwrite.json
    - ./h5bench --debug --abort-on-failure ../../samples/sync-overwrite.json
    - echo "Test h5bench SYNC append"
    - python3 ../../samples/update-perlmutter.py ../../samples/sync-append.json
    - ./h5bench --debug --abort-on-failure ../../samples/sync-append.json
    - echo "Test h5bench SYNC exerciser"
    - python3 ../../samples/update-perlmutter.py ../../samples/sync-exerciser.json
    - ./h5bench --debug --abort-on-failure ../../samples/sync-exerciser.json
    - echo "Test h5bench SYNC metadata"
    - python3 ../../samples/update-perlmutter.py ../../samples/sync-metadata.json
    - ./h5bench --debug --abort-on-failure ../../samples/sync-metadata.json
    - echo "Test h5bench SYNC amrex"
    - python3 ../../samples/update-perlmutter.py ../../samples/sync-amrex.json
    - ./h5bench --debug --abort-on-failure ../../samples/sync-amrex.json
    - echo "Test h5bench SYNC openpmd"
    - python3 ../../samples/update-perlmutter.py ../../samples/sync-openpmd.json
    - ./h5bench --debug --abort-on-failure ../../samples/sync-openpmd.json
# Builds and installs h5bench for the metrics pipeline. Only created for
# scheduled pipelines that set METRICS to "true". Unlike build-perlmutter,
# cmake is invoked without -DH5BENCH_ALL=ON and the job is not manual.
build-perlmutter-metrics:
  stage: build
  id_tokens:
    SITE_ID_TOKEN:
      aud: https://software.nersc.gov/
  rules:
    - if: '$CI_PIPELINE_SOURCE == "schedule" && $METRICS == "true"'
  tags:
    - perlmutter
  variables:
    GIT_SUBMODULE_STRATEGY: recursive
    # NOTE(review): looks like batch-scheduler (Slurm-style) flags consumed by
    # the runner: 1 node, 30-minute limit -- confirm against the runner setup.
    SCHEDULER_PARAMETERS: " -A m2621 --qos=debug --constraint=cpu --tasks-per-node=64 -N 1 -t 00:30:00"
    HDF5_DIR: "/global/cfs/cdirs/m2621/h5bench-perlmutter/hdf5/install"
    HDF5_HOME: "/global/cfs/cdirs/m2621/h5bench-perlmutter/hdf5/install"
  script:
    - echo "Build h5bench"
    - module list
    - module load cmake
    # Out-of-source build: the directory sits two levels below the project
    # root, hence the `../..` passed to cmake.
    - mkdir -p ${H5BENCH_BUILD_PATH}/perlmutter-metrics
    - cd ${H5BENCH_BUILD_PATH}/perlmutter-metrics
    - cmake ../.. -DCMAKE_INSTALL_PREFIX=${H5BENCH_INSTALL_PATH}/perlmutter-metrics
    - make -j 8
    - make install
  # Build and install trees are kept as artifacts for metrics-perlmutter.
  artifacts:
    paths:
      - ${H5BENCH_BUILD_PATH}/perlmutter-metrics
      - ${H5BENCH_INSTALL_PATH}/perlmutter-metrics
# Runs the metrics benchmark configuration, stores the collected metrics via
# workflows/store-metrics.py, and archives logs and outputs in a timestamped
# results directory. Only created for scheduled pipelines with METRICS "true".
metrics-perlmutter:
  stage: metrics
  id_tokens:
    SITE_ID_TOKEN:
      aud: https://software.nersc.gov/
  rules:
    - if: '$CI_PIPELINE_SOURCE == "schedule" && $METRICS == "true"'
  needs: ["build-perlmutter-metrics"]
  tags:
    - perlmutter
  variables:
    # NOTE(review): looks like batch-scheduler (Slurm-style) flags consumed by
    # the runner; this job asks for 8 nodes (-N 8) where the others use 1 --
    # confirm against the runner setup.
    SCHEDULER_PARAMETERS: " -A m2621 --qos=debug --constraint=cpu --tasks-per-node=64 -N 8 -t 00:30:00"
    HDF5_DIR: "/global/cfs/cdirs/m2621/h5bench-perlmutter/hdf5/install"
    HDF5_HOME: "/global/cfs/cdirs/m2621/h5bench-perlmutter/hdf5/install"
    MPICH_MAX_THREAD_SAFETY: "multiple"
  script:
    - hostname
    - echo "JOBID ${SLURM_JOB_ID}"
    - export NERSC_HOST=`cat /etc/clustername`
    - module load python
    - module load darshan
    - echo "h5bench SYNC"
    - cd ${H5BENCH_BUILD_PATH}/perlmutter-metrics
    - export LD_LIBRARY_PATH=$HDF5_DIR/lib:$LD_LIBRARY_PATH
    - echo "Run h5bench SYNC write/read"
    # stderr and stdout are captured to files so they can be archived below.
    - ./h5bench --debug --abort-on-failure --validate-mode ../../samples/metrics-perlmutter.json 2> h5bench-suite-sync.err 1> h5bench-suite-sync.out
    - echo "Install dependencies"
    - pip install pydrive gspread gspread-dataframe google
    - echo "Store h5bench metrics"
    - python3 ../../workflows/store-metrics.py Perlmutter
    - echo "Removing files"
    # -f: a run that left no .h5 files must not abort the job before the
    # results below are archived.
    - rm -f storage-metrics/*.h5
    - export RESULTS="/global/homes/j/jeanbez/h5bench-ci-metrics/perlmutter/$(date +%s)"
    - mkdir -p $RESULTS
    - echo "Fetching Darshan log file"
    # Log directory is <year>/<month>/<day> without zero padding. A single
    # `date` call keeps the three components consistent. Best effort: a
    # missing log is ignored (`|| true`).
    - cp /pscratch/darshanlogs/$(date +%Y/%-m/%-d)/jeanbez_h5bench* ${RESULTS} 2> /dev/null || true
    - echo "Fetching runtime files"
    - cp h5bench-suite-sync.err ${RESULTS}
    - cp h5bench-suite-sync.out ${RESULTS}
    - cp -r storage-metrics/* ${RESULTS}