Skip to content

Commit fd9286e

Browse files
Add energy domain value sets with SWEET ontology mappings
New value sets for DOE Genesis Mission energy domains:
- Geothermal: system types, reservoir types, well types, applications, temperature classification
- Hydrogen: color classification (green, blue, grey, etc.), production methods, storage, applications
- Bioenergy: feedstock types, biofuel types, generation classification, bioconversion processes

Enhanced existing schemas:
- energy.yaml: Added SWEET mappings and CapabilityStatus enum for facility lifecycle
- structural_biology.yaml: Added ontology mappings (CHMO, MOD, MI, FBbi, EDAM)

Mapping predicates used intentionally:
- exact_mappings: Exactly equivalent concepts
- close_mappings: Nearly equivalent (e.g., ETHANOL→sweet:matrEnergy/Ethanol)
- broad_mappings: Target is more general (e.g., HYDROGEN fuel→sweet:matrElement/Hydrogen)
- narrow_mappings: Target is more specific
- related_mappings: Conceptually related but different aspect

Added enum-report script for generating CSV mapping statistics.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
1 parent 1f21cae commit fd9286e

File tree

19 files changed

+5043
-147
lines changed

19 files changed

+5043
-147
lines changed

docs/schema/valuesets.yaml

Lines changed: 1812 additions & 23 deletions
Large diffs are not rendered by default.

justfile

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -368,6 +368,12 @@ uniprot-stats:
368368
echo "Current YAML: [not found]"; \
369369
fi
370370

371+
# Generate CSV report of all enums with mapping statistics
372+
[group('reports')]
373+
enum-report:
374+
uv run python scripts/generate_enum_report.py
375+
@echo "Report saved to enum_report.csv"
376+
371377
# ============== Include project-specific recipes ==============
372378

373379
import "python.justfile"

project/jsonschema/valuesets.schema.json

Lines changed: 242 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -223,6 +223,31 @@
223223
"title": "AnatomicalAxis",
224224
"type": "string"
225225
},
226+
"AnatomicalOrientation": {
227+
"description": "Directional orientation between anatomical positions based on OME NGFF specification",
228+
"enum": [
229+
"LEFT_TO_RIGHT",
230+
"RIGHT_TO_LEFT",
231+
"ANTERIOR_TO_POSTERIOR",
232+
"POSTERIOR_TO_ANTERIOR",
233+
"INFERIOR_TO_SUPERIOR",
234+
"SUPERIOR_TO_INFERIOR",
235+
"DORSAL_TO_VENTRAL",
236+
"VENTRAL_TO_DORSAL",
237+
"DORSAL_TO_PALMAR",
238+
"PALMAR_TO_DORSAL",
239+
"DORSAL_TO_PLANTAR",
240+
"PLANTAR_TO_DORSAL",
241+
"ROSTRAL_TO_CAUDAL",
242+
"CAUDAL_TO_ROSTRAL",
243+
"CRANIAL_TO_CAUDAL",
244+
"CAUDAL_TO_CRANIAL",
245+
"PROXIMAL_TO_DISTAL",
246+
"DISTAL_TO_PROXIMAL"
247+
],
248+
"title": "AnatomicalOrientation",
249+
"type": "string"
250+
},
226251
"AnatomicalPlane": {
227252
"description": "Standard anatomical planes for sectioning",
228253
"enum": [
@@ -528,6 +553,53 @@
528553
"title": "BinaryClassificationEnum",
529554
"type": "string"
530555
},
556+
"BioconversionProcess": {
557+
"description": "Processes for converting biomass feedstocks into biofuels and bioproducts.",
558+
"enum": [
559+
"FERMENTATION",
560+
"ANAEROBIC_DIGESTION",
561+
"TRANSESTERIFICATION",
562+
"HYDROTREATING",
563+
"PYROLYSIS",
564+
"GASIFICATION",
565+
"HYDROTHERMAL_LIQUEFACTION",
566+
"ENZYMATIC_HYDROLYSIS",
567+
"ACID_HYDROLYSIS",
568+
"FISCHER_TROPSCH",
569+
"ALCOHOL_TO_JET"
570+
],
571+
"title": "BioconversionProcess",
572+
"type": "string"
573+
},
574+
"BiofuelGeneration": {
575+
"description": "Classification of biofuels by feedstock source and technology generation.",
576+
"enum": [
577+
"FIRST_GENERATION",
578+
"SECOND_GENERATION",
579+
"THIRD_GENERATION",
580+
"FOURTH_GENERATION"
581+
],
582+
"title": "BiofuelGeneration",
583+
"type": "string"
584+
},
585+
"BiofuelType": {
586+
"description": "Types of fuels produced from biomass feedstocks.",
587+
"enum": [
588+
"ETHANOL",
589+
"BIODIESEL",
590+
"RENEWABLE_DIESEL",
591+
"SUSTAINABLE_AVIATION_FUEL",
592+
"BIOGAS",
593+
"BIOMETHANE",
594+
"BIO_OIL",
595+
"SYNGAS",
596+
"BUTANOL",
597+
"METHANOL",
598+
"DIMETHYL_ETHER"
599+
],
600+
"title": "BiofuelType",
601+
"type": "string"
602+
},
531603
"BioleachMode": {
532604
"description": "Mechanisms of bioleaching including indirect and direct bacterial action.",
533605
"enum": [
@@ -598,6 +670,32 @@
598670
"title": "BiologicalSexEnum",
599671
"type": "string"
600672
},
673+
"BiomassFeedstockType": {
674+
"description": "Types of biomass materials used as feedstocks for bioenergy production. Includes dedicated energy crops, agricultural residues, forest residues, and waste streams.",
675+
"enum": [
676+
"CORN_STOVER",
677+
"WHEAT_STRAW",
678+
"RICE_STRAW",
679+
"SWITCHGRASS",
680+
"MISCANTHUS",
681+
"ENERGY_CANE",
682+
"SWEET_SORGHUM",
683+
"POPLAR",
684+
"WILLOW",
685+
"FOREST_RESIDUE",
686+
"WOOD_PROCESSING_RESIDUE",
687+
"MUNICIPAL_SOLID_WASTE",
688+
"FOOD_WASTE",
689+
"ANIMAL_MANURE",
690+
"ALGAE",
691+
"USED_COOKING_OIL",
692+
"SOYBEAN_OIL",
693+
"CORN_GRAIN",
694+
"SUGARCANE"
695+
],
696+
"title": "BiomassFeedstockType",
697+
"type": "string"
698+
},
601699
"BioreactorTypeEnum": {
602700
"description": "Types of bioreactors used in fermentation and cell culture",
603701
"enum": [
@@ -897,6 +995,18 @@
897995
"title": "CapabilityMaturityLevel",
898996
"type": "string"
899997
},
998+
"CapabilityStatus": {
999+
"description": "Operational status of a capability, facility, or infrastructure. Applicable to energy facilities, research capabilities, and other infrastructure throughout their lifecycle.",
1000+
"enum": [
1001+
"OPERATIONAL",
1002+
"COMING_ONLINE",
1003+
"PILOT",
1004+
"UNDER_DEVELOPMENT",
1005+
"DECOMMISSIONED"
1006+
],
1007+
"title": "CapabilityStatus",
1008+
"type": "string"
1009+
},
9001010
"CarbonIntensity": {
9011011
"description": "Carbon intensity levels for energy sources",
9021012
"enum": [
@@ -3307,6 +3417,72 @@
33073417
"title": "GeologicalEra",
33083418
"type": "string"
33093419
},
3420+
"GeothermalApplication": {
3421+
"description": "Applications and uses of geothermal energy.",
3422+
"enum": [
3423+
"ELECTRICITY_GENERATION",
3424+
"DIRECT_USE_HEATING",
3425+
"GREENHOUSE_HEATING",
3426+
"AQUACULTURE",
3427+
"INDUSTRIAL_PROCESS_HEAT",
3428+
"FOOD_PROCESSING",
3429+
"BATHING_RECREATION",
3430+
"LITHIUM_EXTRACTION"
3431+
],
3432+
"title": "GeothermalApplication",
3433+
"type": "string"
3434+
},
3435+
"GeothermalReservoirType": {
3436+
"description": "Classification of geothermal reservoirs by geological setting and characteristics.",
3437+
"enum": [
3438+
"VOLCANIC",
3439+
"SEDIMENTARY",
3440+
"FRACTURED_BASEMENT",
3441+
"FAULT_CONTROLLED",
3442+
"MAGMATIC",
3443+
"CONDUCTION_DOMINATED"
3444+
],
3445+
"title": "GeothermalReservoirType",
3446+
"type": "string"
3447+
},
3448+
"GeothermalResourceTemperature": {
3449+
"description": "Classification of geothermal resources by temperature range.",
3450+
"enum": [
3451+
"LOW_TEMPERATURE",
3452+
"MODERATE_TEMPERATURE",
3453+
"HIGH_TEMPERATURE",
3454+
"SUPERCRITICAL"
3455+
],
3456+
"title": "GeothermalResourceTemperature",
3457+
"type": "string"
3458+
},
3459+
"GeothermalSystemType": {
3460+
"description": "Types of geothermal energy systems, including conventional hydrothermal and enhanced/engineered geothermal systems.",
3461+
"enum": [
3462+
"HYDROTHERMAL",
3463+
"ENHANCED_GEOTHERMAL_SYSTEM",
3464+
"ADVANCED_GEOTHERMAL_SYSTEM",
3465+
"HOT_DRY_ROCK",
3466+
"GEOPRESSURED",
3467+
"SUPERCRITICAL",
3468+
"GROUND_SOURCE_HEAT_PUMP"
3469+
],
3470+
"title": "GeothermalSystemType",
3471+
"type": "string"
3472+
},
3473+
"GeothermalWellType": {
3474+
"description": "Types of wells used in geothermal energy development and production.",
3475+
"enum": [
3476+
"PRODUCTION_WELL",
3477+
"INJECTION_WELL",
3478+
"EXPLORATION_WELL",
3479+
"OBSERVATION_WELL",
3480+
"SLIM_HOLE",
3481+
"DIRECTIONAL_WELL"
3482+
],
3483+
"title": "GeothermalWellType",
3484+
"type": "string"
3485+
},
33103486
"GridType": {
33113487
"description": "Types of electrical grid systems",
33123488
"enum": [
@@ -3479,6 +3655,72 @@
34793655
"title": "HumanDevelopmentalStage",
34803656
"type": "string"
34813657
},
3658+
"HydrogenApplication": {
3659+
"description": "End-use applications for hydrogen.",
3660+
"enum": [
3661+
"FUEL_CELL_VEHICLE",
3662+
"FUEL_CELL_STATIONARY",
3663+
"INDUSTRIAL_FEEDSTOCK",
3664+
"STEEL_PRODUCTION",
3665+
"AMMONIA_SYNTHESIS",
3666+
"METHANOL_SYNTHESIS",
3667+
"POWER_TO_GAS",
3668+
"BLENDING_NATURAL_GAS",
3669+
"SYNTHETIC_FUELS"
3670+
],
3671+
"title": "HydrogenApplication",
3672+
"type": "string"
3673+
},
3674+
"HydrogenProductionMethod": {
3675+
"description": "Methods and processes for producing hydrogen.",
3676+
"enum": [
3677+
"STEAM_METHANE_REFORMING",
3678+
"AUTOTHERMAL_REFORMING",
3679+
"PARTIAL_OXIDATION",
3680+
"COAL_GASIFICATION",
3681+
"WATER_ELECTROLYSIS",
3682+
"ALKALINE_ELECTROLYSIS",
3683+
"PEM_ELECTROLYSIS",
3684+
"SOLID_OXIDE_ELECTROLYSIS",
3685+
"METHANE_PYROLYSIS",
3686+
"BIOMASS_GASIFICATION",
3687+
"BIOLOGICAL_PRODUCTION",
3688+
"THERMOCHEMICAL_WATER_SPLITTING",
3689+
"PHOTOELECTROCHEMICAL"
3690+
],
3691+
"title": "HydrogenProductionMethod",
3692+
"type": "string"
3693+
},
3694+
"HydrogenStorageMethod": {
3695+
"description": "Methods for storing hydrogen for later use or transport.",
3696+
"enum": [
3697+
"COMPRESSED_GAS",
3698+
"LIQUID_HYDROGEN",
3699+
"METAL_HYDRIDE",
3700+
"CHEMICAL_HYDRIDE",
3701+
"UNDERGROUND_STORAGE",
3702+
"CRYO_COMPRESSED"
3703+
],
3704+
"title": "HydrogenStorageMethod",
3705+
"type": "string"
3706+
},
3707+
"HydrogenType": {
3708+
"description": "Color-coded classification of hydrogen based on production method and carbon intensity. This informal industry taxonomy differentiates hydrogen by its carbon footprint and energy source.",
3709+
"enum": [
3710+
"GREEN_HYDROGEN",
3711+
"BLUE_HYDROGEN",
3712+
"GREY_HYDROGEN",
3713+
"BROWN_HYDROGEN",
3714+
"BLACK_HYDROGEN",
3715+
"PINK_HYDROGEN",
3716+
"TURQUOISE_HYDROGEN",
3717+
"WHITE_HYDROGEN",
3718+
"YELLOW_HYDROGEN",
3719+
"ORANGE_HYDROGEN"
3720+
],
3721+
"title": "HydrogenType",
3722+
"type": "string"
3723+
},
34823724
"IAEAWasteClassificationEnum": {
34833725
"description": "IAEA General Safety Requirements radioactive waste classification scheme",
34843726
"enum": [

0 commit comments

Comments
 (0)