Skip to content

Commit db1f74c

Browse files
Zach Marshall
authored and committed
Fixing a few formatting issues, updating a link, improving some descriptions
1 parent b43e23c commit db1f74c

File tree

1 file changed

+15
-9
lines changed

1 file changed

+15
-9
lines changed

atlas-2025feb-odeo/make_odeo_json.py

Lines changed: 15 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -21,8 +21,12 @@
2121
Open Data for Education and Outreach.
2222
'''
2323

24+
# For working with the metadata records
2425
import json
2526

27+
# For making deep copies of the evergreen data, since we want to change some things
28+
import copy
29+
2630
# Need new recids and DOIs
2731

2832
# Map of skim names into pretty-print descriptions
@@ -78,9 +82,9 @@
7882
skim = 'no' # Fun little hack to fix the English...
7983
name_short = '-'.join(aline.split('_')[2:4]).lower()
8084
if 'Data' in aline:
81-
name = f'Run 2 2015+2016 proton-proton collision data, {skim} skim'
85+
name = f'Run 2 2015+2016 proton-proton collision data beta release, {skim} skim'
8286
else:
83-
name = f'MC simulation, {skim} skim'
87+
name = f'MC simulation, 2015+2016 proton-proton collisions beta release, {skim} skim'
8488
rec_doi = recid_doi_pairs.pop()
8589
dataset_files[ aline.strip() ] = {'name_short':name_short, 'name':name,
8690
'categories':{'source':'ATLAS Collaboration'},'doi':rec_doi[1],'recid':rec_doi[0]}
@@ -135,7 +139,7 @@
135139
},
136140
{
137141
"description": "More about this ntuple format",
138-
"url": "https://opendata.atlas.cern/docs/documentation/data_format/FEB2025_ntuple/"
142+
"url": "https://opendata.atlas.cern/docs/data/for_education/13TeV25_details"
139143
},
140144
{
141145
"description": "Ntuple making framework",
@@ -165,10 +169,10 @@
165169
big_total_events = 0
166170
big_total_size = 0
167171

172+
# Now loop through all the datasets that we are going to publish
168173
for adataset in dataset_files:
169-
my_json = {}
170-
# Update with the stuff that's always good
171-
my_json.update(evergreen_data)
174+
# Start from the stuff that's always good
175+
my_json = copy.deepcopy(evergreen_data)
172176
# Simple abstract for the collection
173177
my_json['abstract'] = {'description':dataset_files[adataset]['name']+' from the ATLAS experiment'}
174178
# Name of the collections, systematically set
@@ -186,7 +190,7 @@
186190
my_json['doi'] = dataset_files[adataset]['doi']
187191
# Update the methodology section with the skim description
188192
skim = adataset.split('_')[2]
189-
my_json['methodology']['description'] += skim_name_map[skim]
193+
my_json['methodology']['description'] = evergreen_data['methodology']['description']+skim_name_map[skim]
190194
# Add a record of the files for this dataset
191195
my_json['files'] = []
192196
# Make list of files for this dataset
@@ -235,13 +239,15 @@
235239
# Update with the stuff that's always good
236240
my_json.update(evergreen_data)
237241
# Simple abstract for the collection
238-
my_json['abstract'] = {'description':'2015 Pb-Pb Open Data for Research from the ATLAS experiment'}
242+
my_json['abstract'] = {'description':'Run 2 2015+2016 proton-proton collision data and corresponding MC simulation Open Data for Education and Outreach from the ATLAS experiment'}
239243
# Name of the collections, systematically set
240244
my_json['collections'] = ['ATLAS-Simulated-Datasets','ATLAS-Primary-Datasets']
241245
my_json['type']['secondary'] = ['Simulated','Collision']
246+
# Description needs a simple update
247+
my_json['methodology']['description'] = evergreen_data['methodology']['description'].replace('the following skimming selection was applied: ','several event pre-selections are available to accelerate analysis, as well as an inclusive set of all events.')
242248
# Add categories, mostly for MC datasets
243249
my_json['categories'] = {'source':'ATLAS Collaboration'}
244-
my_json['title'] = 'ROOT ntuple format 2015-2016 proton-proton Open Data for Education and Outreach from the ATLAS experiment'
250+
my_json['title'] = 'ROOT ntuple format 2015-2016 proton-proton Open Data for Education and Outreach beta release from the ATLAS experiment'
245251
# Add a record ID for CERN Open Data. Reserved range for this release
246252
my_json['recid'] = '93910'
247253
# Add the DOI - these are pre-reserved by the Open Data Portal team

0 commit comments

Comments
 (0)