Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Consolidate python configuration dictionaries #2839

Merged
Merged
Show file tree
Hide file tree
Changes from 5 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
106 changes: 51 additions & 55 deletions workflow/applications/applications.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,6 @@
from typing import Dict, List, Any
from datetime import timedelta
from hosts import Host
from pathlib import Path
from wxflow import Configuration, to_timedelta
from abc import ABC, ABCMeta, abstractmethod

Expand Down Expand Up @@ -32,57 +31,50 @@ def __init__(self, conf: Configuration) -> None:

self.scheduler = Host().scheduler

# Save the configuration so we can source the config files when
# determining task resources
self.conf = conf
self._base = conf.parse_config('config.base')
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Don't like making this an object field. This version should not be needed beyond initialization. All later uses should be using self.configs[run]['base'].

Suggested change
self._base = conf.parse_config('config.base')
base = conf.parse_config('config.base')

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Alright, I removed the _base attribute from the AppConfig class and subclasses. _no_run is no longer referenced anywhere outside of _init_finalize. This is still required to determine which runs are valid for the experiment.


_base = self.conf.parse_config('config.base')
# Define here so the child __init__ functions can use it; will
# be overwritten later during _init_finalize().
self._base = _base

self.mode = _base['MODE']
self.mode = self._base['MODE']

if self.mode not in self.VALID_MODES:
raise NotImplementedError(f'{self.mode} is not a valid application mode.\n' +
'Valid application modes are:\n' +
f'{", ".join(self.VALID_MODES)}')

self.net = _base['NET']
self.model_app = _base.get('APP', 'ATM')
self.do_atm = _base.get('DO_ATM', True)
self.do_wave = _base.get('DO_WAVE', False)
self.do_wave_bnd = _base.get('DOBNDPNT_WAVE', False)
self.do_ocean = _base.get('DO_OCN', False)
self.do_ice = _base.get('DO_ICE', False)
self.do_aero = _base.get('DO_AERO', False)
self.do_prep_obs_aero = _base.get('DO_PREP_OBS_AERO', False)
self.do_bufrsnd = _base.get('DO_BUFRSND', False)
self.do_gempak = _base.get('DO_GEMPAK', False)
self.do_awips = _base.get('DO_AWIPS', False)
self.do_verfozn = _base.get('DO_VERFOZN', True)
self.do_verfrad = _base.get('DO_VERFRAD', True)
self.do_vminmon = _base.get('DO_VMINMON', True)
self.do_tracker = _base.get('DO_TRACKER', True)
self.do_genesis = _base.get('DO_GENESIS', True)
self.do_genesis_fsu = _base.get('DO_GENESIS_FSU', False)
self.do_metp = _base.get('DO_METP', False)
self.do_upp = not _base.get('WRITE_DOPOST', True)
self.do_goes = _base.get('DO_GOES', False)
self.do_mos = _base.get('DO_MOS', False)
self.do_extractvars = _base.get('DO_EXTRACTVARS', False)

self.do_hpssarch = _base.get('HPSSARCH', False)

self.nens = _base.get('NMEM_ENS', 0)
self.fcst_segments = _base.get('FCST_SEGMENTS', None)
raise NotImplementedError(f'{self.mode} is not a valid application mode.\n'
f'Valid application modes are:\n'
f'{", ".join(self.VALID_MODES)}\n')

self.net = self._base['NET']
self.model_app = self._base.get('APP', 'ATM')
self.do_atm = self._base.get('DO_ATM', True)
self.do_wave = self._base.get('DO_WAVE', False)
self.do_wave_bnd = self._base.get('DOBNDPNT_WAVE', False)
self.do_ocean = self._base.get('DO_OCN', False)
self.do_ice = self._base.get('DO_ICE', False)
self.do_aero = self._base.get('DO_AERO', False)
self.do_prep_obs_aero = self._base.get('DO_PREP_OBS_AERO', False)
self.do_bufrsnd = self._base.get('DO_BUFRSND', False)
self.do_gempak = self._base.get('DO_GEMPAK', False)
self.do_awips = self._base.get('DO_AWIPS', False)
self.do_verfozn = self._base.get('DO_VERFOZN', True)
self.do_verfrad = self._base.get('DO_VERFRAD', True)
self.do_vminmon = self._base.get('DO_VMINMON', True)
self.do_tracker = self._base.get('DO_TRACKER', True)
self.do_genesis = self._base.get('DO_GENESIS', True)
self.do_genesis_fsu = self._base.get('DO_GENESIS_FSU', False)
self.do_metp = self._base.get('DO_METP', False)
self.do_upp = not self._base.get('WRITE_DOPOST', True)
self.do_goes = self._base.get('DO_GOES', False)
self.do_mos = self._base.get('DO_MOS', False)
self.do_extractvars = self._base.get('DO_EXTRACTVARS', False)

self.do_hpssarch = self._base.get('HPSSARCH', False)

self.nens = self._base.get('NMEM_ENS', 0)
self.fcst_segments = self._base.get('FCST_SEGMENTS', None)

if not AppConfig.is_monotonic(self.fcst_segments):
raise ValueError(f'Forecast segments do not increase monotonically: {",".join(self.fcst_segments)}')

self.wave_runs = None
if self.do_wave:
wave_run = _base.get('WAVE_RUN', 'BOTH').lower()
wave_run = self._base.get('WAVE_RUN', 'BOTH').lower()
if wave_run in ['both']:
self.wave_runs = ['gfs', 'gdas']
elif wave_run in ['gfs', 'gdas']:
Expand All @@ -91,45 +83,49 @@ def __init__(self, conf: Configuration) -> None:
self.aero_anl_runs = None
self.aero_fcst_runs = None
if self.do_aero:
aero_anl_run = _base.get('AERO_ANL_RUN', 'BOTH').lower()
aero_anl_run = self._base.get('AERO_ANL_RUN', 'BOTH').lower()
if aero_anl_run in ['both']:
self.aero_anl_runs = ['gfs', 'gdas']
elif aero_anl_run in ['gfs', 'gdas']:
self.aero_anl_runs = [aero_anl_run]
aero_fcst_run = _base.get('AERO_FCST_RUN', None).lower()
aero_fcst_run = self._base.get('AERO_FCST_RUN', None).lower()
if aero_fcst_run in ['both']:
self.aero_fcst_runs = ['gfs', 'gdas']
elif aero_fcst_run in ['gfs', 'gdas']:
self.aero_fcst_runs = [aero_fcst_run]

def _init_finalize(self, *args):
def _init_finalize(self, conf: Configuration):
print("Finalizing initialize")

# Get a list of all possible config_files that would be part of the application
self.configs_names = self._get_app_configs()

# Source the config_files for the jobs in the application
self.configs = self.source_configs()
# Source the config files for the jobs in the application without specifying a RUN
self.configs = {'_no_run': self._source_configs(conf)}
WalterKolczynski-NOAA marked this conversation as resolved.
Show resolved Hide resolved

# Update the base config dictionary base on application
self.configs['base'] = self.update_base(self.configs['base'])
self.configs['_no_run']['base'] = self._update_base(self.configs['_no_run']['base'])

# Save base in the internal state since it is often needed
self._base = self.configs['base']
self._base = self.configs['_no_run']['base']

# Get more configuration options into the class attributes
self.gfs_cyc = self._base.get('gfs_cyc')

# Finally get task names for the application
# Get task names for the application
self.task_names = self.get_task_names()

# Finally, source the configuration files for each valid `RUN`
for run in self.task_names.keys():
self.configs[run] = self._source_configs(conf, run=run, log=False)

@abstractmethod
def _get_app_configs(self):
pass

@staticmethod
@abstractmethod
def update_base(base_in: Dict[str, Any]) -> Dict[str, Any]:
def _update_base(base_in: Dict[str, Any]) -> Dict[str, Any]:
'''
Make final updates to base and return an updated copy

Expand All @@ -146,7 +142,7 @@ def update_base(base_in: Dict[str, Any]) -> Dict[str, Any]:
'''
pass

def source_configs(self, run: str = "gfs", log: bool = True) -> Dict[str, Any]:
def _source_configs(self, conf: Configuration, run: str = "gfs", log: bool = True) -> Dict[str, Any]:
"""
Given the configuration object used to initialize this application,
source the configurations for each config and return a dictionary
Expand All @@ -156,7 +152,7 @@ def source_configs(self, run: str = "gfs", log: bool = True) -> Dict[str, Any]:
configs = dict()

# Return config.base as well
configs['base'] = self.conf.parse_config('config.base')
configs['base'] = conf.parse_config('config.base')
WalterKolczynski-NOAA marked this conversation as resolved.
Show resolved Hide resolved

# Source the list of all config_files involved in the application
for config in self.configs_names:
Expand All @@ -180,7 +176,7 @@ def source_configs(self, run: str = "gfs", log: bool = True) -> Dict[str, Any]:
files += [f'config.{config}']

print(f'sourcing config.{config}') if log else 0
configs[config] = self.conf.parse_config(files, RUN=run)
configs[config] = conf.parse_config(files, RUN=run)

return configs

Expand Down
2 changes: 1 addition & 1 deletion workflow/applications/gefs.py
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,7 @@ def _get_app_configs(self):
return configs

@staticmethod
def update_base(base_in):
def _update_base(base_in):

base_out = base_in.copy()
base_out['INTERVAL_GFS'] = AppConfig.get_gfs_interval(base_in['gfs_cyc'])
Expand Down
2 changes: 1 addition & 1 deletion workflow/applications/gfs_cycled.py
Original file line number Diff line number Diff line change
Expand Up @@ -123,7 +123,7 @@ def _get_app_configs(self):
return configs

@staticmethod
def update_base(base_in):
def _update_base(base_in):

return GFSCycledAppConfig.get_gfs_cyc_dates(base_in)

Expand Down
3 changes: 1 addition & 2 deletions workflow/applications/gfs_forecast_only.py
Original file line number Diff line number Diff line change
Expand Up @@ -70,11 +70,10 @@ def _get_app_configs(self):
return configs

@staticmethod
def update_base(base_in):
def _update_base(base_in):

base_out = base_in.copy()
base_out['INTERVAL_GFS'] = AppConfig.get_gfs_interval(base_in['gfs_cyc'])
base_out['RUN'] = 'gfs'

return base_out

Expand Down
15 changes: 7 additions & 8 deletions workflow/rocoto/tasks.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,5 @@
#!/usr/bin/env python3

import copy
import numpy as np
from applications.applications import AppConfig
import rocoto.rocoto as rocoto
Expand Down Expand Up @@ -39,15 +38,16 @@ class Tasks:

def __init__(self, app_config: AppConfig, run: str) -> None:

self.app_config = copy.deepcopy(app_config)
self.app_config = app_config
self.run = run
# Re-source the configs with RUN specified
print(f"Source configs with RUN={run}")
self._configs = self.app_config.source_configs(run=run, log=False)

# Get the configs for the specified RUN
self._configs = self.app_config.configs[run]

# Update the base config for the application
self._configs['base'] = self.app_config.update_base(self._configs['base'])
# Save dict_configs and base in the internal state (never know where it may be needed)
self._configs['base'] = self.app_config._update_base(self._configs['base'])
WalterKolczynski-NOAA marked this conversation as resolved.
Show resolved Hide resolved

# Save base in the internal state (never know where it may be needed)
self._base = self._configs['base']

self.HOMEgfs = self._base['HOMEgfs']
Expand Down Expand Up @@ -134,7 +134,6 @@ def _template_to_rocoto_cycstring(self, template: str, subs_dict: dict = {}) ->
def _get_forecast_hours(run, config, component='atmos') -> List[str]:
# Make a local copy of the config to avoid modifying the original
local_config = config.copy()

# Ocean/Ice components do not have a HF output option like the atmosphere
if component in ['ocean', 'ice']:
local_config['FHMAX_HF_GFS'] = 0
Expand Down
3 changes: 2 additions & 1 deletion workflow/rocoto/workflow_xml.py
Original file line number Diff line number Diff line change
Expand Up @@ -18,7 +18,8 @@ def __init__(self, app_config: AppConfig, rocoto_config: Dict) -> None:
self._app_config = app_config
self.rocoto_config = rocoto_config

self._base = self._app_config.configs['base']
# Use the generic config.base (without RUN specified)
self._base = self._app_config.configs['_no_run']['base']

self.preamble = self._get_preamble()
self.definitions = self._get_definitions()
Expand Down
Loading