Skip to content

Commit f655899

Browse files
clean up of configs for cmip examples
1 parent b11a8e3 commit f655899

File tree

3 files changed

+87
-1
lines changed

3 files changed

+87
-1
lines changed
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -38,6 +38,6 @@ output_file_template: ['variable_id','table_id','source_id','experiment_id','mem
3838

3939
#######################################################
4040

41-
input_path: "/uda/CMIP6/CMIP/NOAA-GFDL/GFDL-ESM4/"
41+
input_path: "/uda/CMIP6/CMIP/NOAA-GFDL/"
4242
#"/archive/am5/am5/am5f3b1r0/c96L65_am5f3b1r0_pdclim1850F/gfdl.ncrc5-deploy-prod-openmp/pp/" #"ENTER INPUT PATH HERE" #Example: /Users/ar46/archive/am5/am5/am5f3b1r0/c96L65_am5f3b1r0_pdclim1850F/gfdl.ncrc5-deploy-prod-openmp/pp/"
4343
output_path: "catalogcmip" # ENTER NAME OF THE CSV AND JSON, THE SUFFIX ALONE, e.g. catalog (the builder then generates catalog.csv and catalog.json). This can also be an absolute path.

configs/config-cmip-esm4.yaml

Lines changed: 43 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,43 @@
1+
#what kind of directory structure to expect?
2+
#For a directory structure like /archive/am5/am5/am5f3b1r0/c96L65_am5f3b1r0_pdclim1850F/gfdl.ncrc5-deploy-prod-openmp/pp
3+
# the output_path_template is set as follows.
4+
#We have NA in those values that do not match up with any of the expected headerlist (CSV columns), otherwise we
5+
#simply specify the associated header name in the appropriate place. E.g. The third directory in the PP path example
6+
#above is the model (source_id), so the third list value in output_path_template is set to 'source_id'. We make sure
7+
#this is a valid value in headerlist as well.
8+
#The fourth directory is am5f3b1r0 which does not map to an existing header value. So we simply use NA in output_path_template
9+
#for the fourth value.
10+
11+
#catalog headers
12+
#The headerlist is the expected column names in your catalog/csv file. This is usually determined by the users in conjunction
13+
#with the ESM collection specification standards and the appropriate workflows.
14+
15+
headerlist: ["activity_id", "institution_id", "source_id", "experiment_id",
16+
"frequency", "realm", "table_id",
17+
"member_id", "grid_label", "variable_id","version_id",
18+
"time_range", "chunk_freq","platform","dimensions","cell_methods","path"]
19+
20+
#what kind of directory structure to expect?
21+
#For a directory structure like /archive/am5/am5/am5f3b1r0/c96L65_am5f3b1r0_pdclim1850F/gfdl.ncrc5-deploy-prod-openmp/pp
22+
# the output_path_template is set as follows.
23+
#We have NA in those values that do not match up with any of the expected headerlist (CSV columns), otherwise we
24+
#simply specify the associated header name in the appropriate place. E.g. The third directory in the PP path example
25+
#above is the model (source_id), so the third list value in output_path_template is set to 'source_id'. We make sure
26+
#this is a valid value in headerlist as well.
27+
#The fourth directory is am5f3b1r0 which does not map to an existing header value. So we simply use NA in output_path_template
28+
#for the fourth value.
29+
#project_dir = "/uda/data_cmip6/CMIP6/CMIP/NOAA-GFDL/GFDL-ESM4/"
30+
#/uda/CMIP6/CMIP/NOAA-GFDL/GFDL-ESM4/1pctCO2/r1i1p1f1/Amon/tas/gr1/v20180701/tas_Amon_GFDL-ESM4_1pctCO2_r1i1p1f1_gr1_000101-010012.nc
31+
output_path_template: ['NA','activity_id','NA','institution_id','source_id','experiment_id','member_id','table_id','variable_id','grid_label','version_id']
32+
33+
output_file_template: ['variable_id','table_id','source_id','experiment_id','member_id','grid_label','time_range']
34+
35+
#OUTPUT FILE INFO is currently passed as command-line argument.
36+
#We will revisit adding a csvfile, jsonfile and logfile configuration to the builder configuration file in the future.
37+
#csvfile = #jsonfile = #logfile =
38+
39+
#######################################################
40+
41+
input_path: "/uda/CMIP6/CMIP/NOAA-GFDL/GFDL-ESM4/"
42+
#"/archive/am5/am5/am5f3b1r0/c96L65_am5f3b1r0_pdclim1850F/gfdl.ncrc5-deploy-prod-openmp/pp/" #"ENTER INPUT PATH HERE" #Example: /Users/ar46/archive/am5/am5/am5f3b1r0/c96L65_am5f3b1r0_pdclim1850F/gfdl.ncrc5-deploy-prod-openmp/pp/"
43+
output_path: "catalogcmiptest" # ENTER NAME OF THE CSV AND JSON, THE SUFFIX ALONE, e.g. catalog (the builder then generates catalog.csv and catalog.json). This can also be an absolute path.

configs/config-uda-cmip.yaml

Lines changed: 43 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,43 @@
1+
#what kind of directory structure to expect?
2+
#For a directory structure like /archive/am5/am5/am5f3b1r0/c96L65_am5f3b1r0_pdclim1850F/gfdl.ncrc5-deploy-prod-openmp/pp
3+
# the output_path_template is set as follows.
4+
#We have NA in those values that do not match up with any of the expected headerlist (CSV columns), otherwise we
5+
#simply specify the associated header name in the appropriate place. E.g. The third directory in the PP path example
6+
#above is the model (source_id), so the third list value in output_path_template is set to 'source_id'. We make sure
7+
#this is a valid value in headerlist as well.
8+
#The fourth directory is am5f3b1r0 which does not map to an existing header value. So we simply use NA in output_path_template
9+
#for the fourth value.
10+
11+
#catalog headers
12+
#The headerlist is the expected column names in your catalog/csv file. This is usually determined by the users in conjunction
13+
#with the ESM collection specification standards and the appropriate workflows.
14+
15+
headerlist: ["activity_id", "institution_id", "source_id", "experiment_id",
16+
"frequency", "realm", "table_id",
17+
"member_id", "grid_label", "variable_id","version_id",
18+
"time_range", "chunk_freq","platform","dimensions","cell_methods","path"]
19+
20+
#what kind of directory structure to expect?
21+
#For a directory structure like /archive/am5/am5/am5f3b1r0/c96L65_am5f3b1r0_pdclim1850F/gfdl.ncrc5-deploy-prod-openmp/pp
22+
# the output_path_template is set as follows.
23+
#We have NA in those values that do not match up with any of the expected headerlist (CSV columns), otherwise we
24+
#simply specify the associated header name in the appropriate place. E.g. The third directory in the PP path example
25+
#above is the model (source_id), so the third list value in output_path_template is set to 'source_id'. We make sure
26+
#this is a valid value in headerlist as well.
27+
#The fourth directory is am5f3b1r0 which does not map to an existing header value. So we simply use NA in output_path_template
28+
#for the fourth value.
29+
#project_dir = "/uda/data_cmip6/CMIP6/CMIP/NOAA-GFDL/GFDL-ESM4/"
30+
#/uda/CMIP6/CMIP/NOAA-GFDL/GFDL-ESM4/1pctCO2/r1i1p1f1/Amon/tas/gr1/v20180701/tas_Amon_GFDL-ESM4_1pctCO2_r1i1p1f1_gr1_000101-010012.nc
31+
output_path_template: ['NA','activity_id','NA','institution_id','source_id','experiment_id','member_id','table_id','variable_id','grid_label','version_id']
32+
33+
output_file_template: ['variable_id','table_id','source_id','experiment_id','member_id','grid_label','time_range']
34+
35+
#OUTPUT FILE INFO is currently passed as command-line argument.
36+
#We will revisit adding a csvfile, jsonfile and logfile configuration to the builder configuration file in the future.
37+
#csvfile = #jsonfile = #logfile =
38+
39+
#######################################################
40+
41+
input_path: "/uda/CMIP6/CMIP/NOAA-GFDL/"
42+
#"/archive/am5/am5/am5f3b1r0/c96L65_am5f3b1r0_pdclim1850F/gfdl.ncrc5-deploy-prod-openmp/pp/" #"ENTER INPUT PATH HERE" #Example: /Users/ar46/archive/am5/am5/am5f3b1r0/c96L65_am5f3b1r0_pdclim1850F/gfdl.ncrc5-deploy-prod-openmp/pp/"
43+
output_path: "catalogcmip" # ENTER NAME OF THE CSV AND JSON, THE SUFFIX ALONE, e.g. catalog (the builder then generates catalog.csv and catalog.json). This can also be an absolute path.

0 commit comments

Comments
 (0)