@@ -508,23 +508,10 @@ steps:
508
508
--data_dir prep_remap/output_active --out_dir remap_pipeline_output
509
509
artifact_paths : " remap_pipeline_output/*"
510
510
511
- - group : " Configs"
512
- steps :
513
-
514
- # TODO: we should somehow decouple this unit test from the perf env / scripts
515
- - label : " :computer: checkbounds"
516
- command : >
517
- julia --color=yes --check-bounds=yes --project=.buildkite perf/benchmark.jl
518
- --config_file $PERF_CONFIG_PATH/checkbounds.yml
519
- --job_id checkbounds
520
- artifact_paths : " checkbounds/output_active/*"
521
- agents :
522
- slurm_mem : 20GB
523
-
524
511
- group : " EDOnlyEDMFX"
525
512
steps :
526
513
527
- - label : " :man_in_business_suit_levitating: EDOnlyEDMFX test on a sphere "
514
+ - label : " :man_in_business_suit_levitating: EDOnly EDMFX aquaplanet "
528
515
command : >
529
516
julia --color=yes --project=.buildkite .buildkite/ci_driver.jl
530
517
--config_file $CONFIG_PATH/edonly_edmfx_aquaplanet.yml
@@ -533,18 +520,6 @@ steps:
533
520
agents :
534
521
slurm_mem : 20GB
535
522
536
- - label : " :man_in_business_suit_levitating: EDOnlyEDMFX test on a sphere GPU"
537
- command : >
538
- julia --color=yes --project=.buildkite .buildkite/ci_driver.jl
539
- --config_file $CONFIG_PATH/edonly_edmfx_aquaplanet.yml
540
- --job_id edonly_edmfx_aquaplanet_gpu
541
- artifact_paths : " edonly_edmfx_aquaplanet_gpu/output_active/*"
542
- env :
543
- CLIMACOMMS_DEVICE : " CUDA"
544
- agents :
545
- slurm_mem : 20GB
546
- slurm_gpus : 1
547
-
548
523
- group : " Diagnostic EDMFX"
549
524
steps :
550
525
@@ -647,7 +622,7 @@ steps:
647
622
agents :
648
623
slurm_mem : 20GB
649
624
650
- - label : " :genie: Diagnostic EDMFX aquaplanet with TKE "
625
+ - label : " :genie: Diagnostic EDMFX aquaplanet"
651
626
command : >
652
627
julia --color=yes --project=.buildkite .buildkite/ci_driver.jl
653
628
--config_file $CONFIG_PATH/diagnostic_edmfx_aquaplanet.yml
@@ -682,6 +657,15 @@ steps:
682
657
artifact_paths : " prognostic_edmfx_simpleplume_column/output_active/*"
683
658
agents :
684
659
slurm_mem : 20GB
660
+
661
+ - label : " :genie: Prognostic EDMFX Soares in a column"
662
+ command : >
663
+ julia --color=yes --project=.buildkite .buildkite/ci_driver.jl
664
+ --config_file $CONFIG_PATH/prognostic_edmfx_soares_column.yml
665
+ --job_id prognostic_edmfx_soares_column
666
+ artifact_paths : " prognostic_edmfx_soares_column/output_active/*"
667
+ agents :
668
+ slurm_mem : 20GB
685
669
686
670
- label : " :genie: Prognostic EDMFX GABLS in a column"
687
671
command : >
@@ -803,15 +787,6 @@ steps:
803
787
agents :
804
788
slurm_mem : 20GB
805
789
806
- - label : " :genie: Prognostic EDMFX Soares in a column"
807
- command : >
808
- julia --color=yes --project=.buildkite .buildkite/ci_driver.jl
809
- --config_file $CONFIG_PATH/prognostic_edmfx_soares_column.yml
810
- --job_id prognostic_edmfx_soares_column
811
- artifact_paths : " prognostic_edmfx_soares_column/output_active/*"
812
- agents :
813
- slurm_mem : 20GB
814
-
815
790
- group : " GPU"
816
791
steps :
817
792
@@ -923,31 +898,29 @@ steps:
923
898
slurm_gpus : 1
924
899
slurm_mem : 16G
925
900
926
- - label : " :umbrella: GPU: gpu_aquaplanet_dyamond"
927
- command :
928
- - mkdir -p gpu_aquaplanet_dyamond
929
- - >
930
- julia --color=yes --project=.buildkite .buildkite/ci_driver.jl
931
- --config_file ${CONFIG_PATH}/gpu_aquaplanet_dyamond.yml
932
- --job_id gpu_aquaplanet_dyamond
933
- artifact_paths : " gpu_aquaplanet_dyamond/output_active/*"
901
+ - label : " GPU: test DYAMOND interpolated initial conditions"
902
+ command : >
903
+ julia --color=yes --project=.buildkite .buildkite/ci_driver.jl
904
+ --config_file $GPU_CONFIG_PATH/gpu_aquaplanet_dyamond_summer.yml
905
+ --job_id gpu_aquaplanet_dyamond_summer
906
+ artifact_paths : " gpu_aquaplanet_dyamond_summer/output_active/*"
934
907
env :
935
908
CLIMACOMMS_DEVICE : " CUDA"
936
909
agents :
937
910
slurm_gpus : 1
938
911
slurm_mem : 16G
939
912
940
- - label : " GPU: test DYAMOND interpolated initial conditions "
913
+ - label : " GPU: EDOnly EDMFX aquaplanet "
941
914
command : >
942
915
julia --color=yes --project=.buildkite .buildkite/ci_driver.jl
943
- --config_file $GPU_CONFIG_PATH/gpu_aquaplanet_dyamond_summer.yml
944
- --job_id gpu_aquaplanet_dyamond_summer
945
- artifact_paths : " gpu_aquaplanet_dyamond_summer/output_active/*"
916
+ --config_file $CONFIG_PATH/edonly_edmfx_aquaplanet.yml
917
+ --job_id edonly_edmfx_aquaplanet_gpu
918
+ artifact_paths : " edonly_edmfx_aquaplanet_gpu/output_active/*"
946
919
env :
947
920
CLIMACOMMS_DEVICE : " CUDA"
948
921
agents :
922
+ slurm_mem : 20GB
949
923
slurm_gpus : 1
950
- slurm_mem : 16G
951
924
952
925
- label : " GPU: Diagnostic EDMFX aquaplanet"
953
926
key : " diagnostic_edmfx_aquaplanet_gpu"
@@ -977,47 +950,34 @@ steps:
977
950
- group : " Benchmarks"
978
951
steps :
979
952
980
- - label : " :computer: Benchmark: GPU implicit baro wave"
953
+ - label : " :computer: Benchmark: CPU baroclinic wave moist "
981
954
command : >
982
-
983
955
julia --color=yes --project=.buildkite perf/benchmark_step.jl
984
- --config_file $PERF_CONFIG_PATH/gpu_implicit_barowave.yml
985
- --job_id gpu_implicit_barowave
986
- artifact_paths : " gpu_implicit_barowave/output_active/*"
987
- env :
988
- CLIMACOMMS_DEVICE : " CUDA"
989
- agents :
990
- slurm_gpus : 1
956
+ --config_file $PERF_CONFIG_PATH/bm_baroclinic_wave_moist.yml
957
+ --job_id bm_baroclinic_wave_moist
958
+ artifact_paths : " bm_baroclinic_wave_moist/output_active/*"
991
959
992
- - label : " :computer: Benchmark: GPU implicit baro wave moist"
960
+ - label : " :computer: Benchmark: GPU baroclinic wave moist"
993
961
command : >
994
962
995
963
julia --color=yes --project=.buildkite perf/benchmark_step.jl
996
- --config_file $PERF_CONFIG_PATH/gpu_implicit_barowave_moist.yml
997
- --job_id gpu_implicit_barowave_moist
998
- artifact_paths : " gpu_implicit_barowave_moist/output_active/*"
964
+ --config_file $PERF_CONFIG_PATH/bm_baroclinic_wave_moist.yml
965
+ --job_id bm_baroclinic_wave_moist_gpu
966
+ artifact_paths : " bm_baroclinic_wave_moist_gpu/output_active/*"
999
967
env :
1000
968
CLIMACOMMS_DEVICE : " CUDA"
1001
969
agents :
1002
970
slurm_mem : 16G
1003
971
slurm_gpus : 1
1004
972
1005
- - label : " :computer: Benchmark: CPU implicit baro wave"
1006
- command : >
1007
- julia --color=yes --project=.buildkite perf/benchmark_step.jl
1008
- --config_file $PERF_CONFIG_PATH/cpu_implicit_barowave.yml
1009
- --job_id cpu_implicit_barowave
1010
- artifact_paths : " cpu_implicit_barowave/output_active/*"
1011
-
1012
- # Benchmarks
1013
973
- label : " :computer: Benchmark: CPU perf target (default)"
1014
974
command : >
1015
975
julia --color=yes --project=.buildkite perf/benchmark.jl
1016
976
--config_file $PERF_CONFIG_PATH/bm_perf_target.yml
1017
977
--job_id bm_perf_target
1018
978
agents :
1019
979
slurm_mem : 24GB
1020
-
980
+
1021
981
- label : " :computer: Benchmark: GPU perf target"
1022
982
command : >
1023
983
julia --color=yes --project=.buildkite perf/benchmark.jl
@@ -1055,6 +1015,19 @@ steps:
1055
1015
- group : " Flame graphs"
1056
1016
steps :
1057
1017
1018
+ - label : " :fire: Flame graph: gpu job"
1019
+ command : >
1020
+ julia --color=yes --project=.buildkite perf/flame.jl
1021
+ --config_file $PERF_CONFIG_PATH/bm_baroclinic_wave_moist.yml
1022
+ --job_id flame_baroclinic_wave_moist_gpu
1023
+ artifact_paths : " flame_baroclinic_wave_moist_gpu/*"
1024
+ env :
1025
+ CLIMACOMMS_DEVICE : " CUDA"
1026
+ agents :
1027
+ slurm_mem : 48GB
1028
+ slurm_gpus : 1
1029
+ gres : " gpu:p100:1"
1030
+
1058
1031
- label : " :fire: Flame graph: perf target (default)"
1059
1032
command : >
1060
1033
julia --color=yes --project=.buildkite perf/flame.jl
@@ -1072,6 +1045,15 @@ steps:
1072
1045
artifact_paths : " flame_perf_target_tracers/*"
1073
1046
agents :
1074
1047
slurm_mem : 24GB
1048
+
1049
+ - label : " :fire: Flame graph: perf target (diagnostics)"
1050
+ command : >
1051
+ julia --color=yes --project=.buildkite perf/flame.jl
1052
+ --config_file $PERF_CONFIG_PATH/flame_perf_diagnostics.yml
1053
+ --job_id flame_perf_diagnostics
1054
+ artifact_paths : " flame_perf_diagnostics/*"
1055
+ agents :
1056
+ slurm_mem : 24GB
1075
1057
1076
1058
- label : " :fire: Flame graph: perf target (diagnostic edmfx)"
1077
1059
command : >
@@ -1082,12 +1064,12 @@ steps:
1082
1064
agents :
1083
1065
slurm_mem : 24GB
1084
1066
1085
- - label : " :fire: Flame graph: perf target (prognostic edmfx aquaplanet)"
1067
+ - label : " :fire: Flame graph: perf target (prognostic edmfx)"
1086
1068
command : >
1087
1069
julia --color=yes --project=.buildkite perf/flame.jl
1088
- --config_file $PERF_CONFIG_PATH/flame_perf_target_prognostic_edmfx_aquaplanet.yml
1089
- --job_id flame_perf_target_prognostic_edmfx_aquaplanet
1090
- artifact_paths : " flame_perf_target_prognostic_edmfx_aquaplanet/*"
1070
+ --config_file $PERF_CONFIG_PATH/flame_perf_target_prognostic_edmfx.yml
1071
+ --job_id flame_perf_target_prognostic_edmfx
1072
+ artifact_paths : " flame_perf_target_prognostic_edmfx/*"
1091
1073
agents :
1092
1074
slurm_mem : 32GB
1093
1075
@@ -1118,36 +1100,25 @@ steps:
1118
1100
agents :
1119
1101
slurm_mem : 24GB
1120
1102
1121
- - label : " :fire: Flame graph: perf target (diagnostics)"
1122
- command : >
1123
- julia --color=yes --project=.buildkite perf/flame.jl
1124
- --config_file $PERF_CONFIG_PATH/flame_perf_diagnostics.yml
1125
- --job_id flame_perf_diagnostics
1126
- artifact_paths : " flame_perf_diagnostics/*"
1127
- agents :
1128
- slurm_mem : 24GB
1103
+ - group : " Checkbounds/Inference/Invalidations"
1104
+ steps :
1129
1105
1130
- - label : " :fire: Flame graph: gpu job"
1106
+ # TODO: we should somehow decouple this unit test from the perf env / scripts
1107
+ # Checkbounds
1108
+ - label : " :computer: checkbounds"
1131
1109
command : >
1132
- julia --color=yes --project=.buildkite perf/flame.jl
1133
- --config_file $PERF_CONFIG_PATH/flame_gpu_implicit_barowave_moist.yml
1134
- --job_id flame_gpu_implicit_barowave_moist
1135
- artifact_paths : " flame_gpu_implicit_barowave_moist/*"
1136
- env :
1137
- CLIMACOMMS_DEVICE : " CUDA"
1110
+ julia --color=yes --check-bounds=yes --project=.buildkite perf/benchmark.jl
1111
+ --config_file $PERF_CONFIG_PATH/flame_perf_target.yml
1112
+ --job_id checkbounds
1113
+ artifact_paths : " checkbounds/output_active/*"
1138
1114
agents :
1139
- slurm_mem : 48GB
1140
- slurm_gpus : 1
1141
- gres : " gpu:p100:1"
1142
-
1143
- - group : " Inference/Invalidations"
1144
- steps :
1115
+ slurm_mem : 20GB
1145
1116
1146
1117
# Inference
1147
1118
- label : " :rocket: JET n-failures (inference)"
1148
1119
command : >
1149
1120
julia --color=yes --project=.buildkite perf/jet_test_nfailures.jl
1150
- --config_file $PERF_CONFIG_PATH/jet_n_failures.yml
1121
+ --config_file $PERF_CONFIG_PATH/flame_perf_target.yml
1151
1122
--job_id jet_n_failures
1152
1123
agents :
1153
1124
slurm_mem : 24GB
@@ -1156,6 +1127,7 @@ steps:
1156
1127
- label : " :mag::rocket: Invalidations"
1157
1128
command : >
1158
1129
julia --color=yes --project=.buildkite perf/invalidations.jl
1130
+ --config_file $PERF_CONFIG_PATH/flame_perf_target.yml
1159
1131
artifact_paths : " invalidations/*"
1160
1132
agents :
1161
1133
slurm_mem : 24GB
0 commit comments