-
Notifications
You must be signed in to change notification settings - Fork 64
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Add initial version of ccpp_track_variables.py #419
Changes from 33 commits
f2619d9
2f209a5
5715006
4160be2
e9da740
31245e1
83f733f
6cb14c9
0ceb853
a332867
e64dbe3
64dad53
67229d2
36a23e6
5f9e029
5e03756
8ec769d
6c7cfe9
9fa53bb
d64a0fb
c2012ba
08c2027
566e485
9e6b59a
bc6963a
1193e44
c7cc6e4
12d9078
ee99e7e
b8654c4
5f545d7
c27f06f
3f1dd5b
948b620
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,191 @@ | ||
#!/usr/bin/env python3 | ||
|
||
# Standard modules | ||
import os | ||
import argparse | ||
import logging | ||
import glob | ||
|
||
# CCPP framework imports | ||
from metadata_table import find_scheme_names, parse_metadata_file | ||
from ccpp_prebuild import import_config, gather_variable_definitions | ||
from mkstatic import Suite | ||
from parse_checkers import registered_fortran_ddt_names | ||
from parse_tools import init_log, set_log_level | ||
from framework_env import CCPPFrameworkEnv | ||
|
||
############################################################################### | ||
# Set up the command line argument parser and other global variables # | ||
############################################################################### | ||
|
||
############################################################################### | ||
# Functions and subroutines # | ||
############################################################################### | ||
|
||
def parse_arguments(): | ||
"""Parse command line arguments.""" | ||
parser = argparse.ArgumentParser() | ||
parser.add_argument('-s', '--sdf', help='suite definition file to parse', required=True) | ||
parser.add_argument('-m', '--metadata_path', | ||
help='path to CCPP scheme metadata files', required=True) | ||
parser.add_argument('-c', '--config', | ||
help='path to CCPP prebuild configuration file', required=True) | ||
parser.add_argument('-v', '--variable', help='variable to track through CCPP suite', | ||
required=True) | ||
parser.add_argument('--debug', action='store_true', help='enable debugging output', | ||
default=False) | ||
|
||
args = parser.parse_args() | ||
|
||
return(args) | ||
|
||
def setup_logging(debug): | ||
"""Sets up the logging module and logging level.""" | ||
|
||
#Use capgen logging tools | ||
logger = init_log('ccpp_track_variables') | ||
|
||
if debug: | ||
set_log_level(logger, logging.DEBUG) | ||
logger.info('Logging level set to DEBUG') | ||
else: | ||
set_log_level(logger, logging.WARNING) | ||
return logger | ||
|
||
def parse_suite(sdf, run_env): | ||
"""Reads the provided sdf, parses into a Suite data structure, including the "call tree": | ||
the ordered list of schemes for the suite specified by the provided sdf""" | ||
run_env.logger.info(f'Reading sdf {sdf} and populating Suite object') | ||
suite = Suite(sdf_name=sdf) | ||
run_env.logger.info(f'Reading sdf {sdf} and populating Suite object') | ||
success = suite.parse(make_call_tree=True) | ||
if not success: | ||
raise Exception(f'Parsing suite definition file {sdf} failed.') | ||
run_env.logger.info(f'Successfully read sdf {suite.sdf_name}') | ||
return suite | ||
|
||
def create_metadata_filename_dict(metapath): | ||
"""Given a path, read all .meta files in that directory and add them to a dictionary: the keys | ||
are the name of the scheme, and the values are the filename of the .meta file associated | ||
with that scheme""" | ||
|
||
metadata_dict = {} | ||
scheme_filenames = glob.glob(os.path.join(metapath, "*.meta")) | ||
if not scheme_filenames: | ||
raise Exception(f'No files found in {metapath} with ".meta" extension') | ||
|
||
for scheme_fn in scheme_filenames: | ||
schemes = find_scheme_names(scheme_fn) | ||
# The above returns a list of schemes in each filename, but | ||
# we want a dictionary of schemes associated with filenames: | ||
for scheme in schemes: | ||
metadata_dict[scheme] = scheme_fn | ||
|
||
return metadata_dict | ||
|
||
|
||
def create_var_graph(suite, var, config, metapath, run_env): | ||
"""Given a suite, variable name, a 'config' dictionary, and a path to .meta files: | ||
1. Creates a dictionary associating schemes with their .meta files | ||
2. Loops through the call tree of the provided suite | ||
3. For each scheme, reads .meta file for said scheme, checks for variable within that | ||
scheme, and if it exists, adds an entry to a list of tuples, where each tuple includes | ||
the name of the scheme and the intent of the variable within that scheme""" | ||
|
||
# Create a list of tuples that will hold the in/out information for each scheme | ||
var_graph = [] | ||
|
||
run_env.logger.debug(f"reading .meta files in path:\n {metapath}") | ||
metadata_dict=create_metadata_filename_dict(metapath) | ||
|
||
run_env.logger.debug(f"reading metadata files for schemes defined in config file: " | ||
f"{config['scheme_files']}") | ||
|
||
# Loop through call tree, find matching filename for scheme via dictionary schemes_in_files, | ||
# then parse that metadata file to find variable info | ||
partial_matches = {} | ||
for scheme in suite.call_tree: | ||
run_env.logger.debug(f"reading meta file for scheme {scheme} ") | ||
|
||
if scheme in metadata_dict: | ||
scheme_filename = metadata_dict[scheme] | ||
else: | ||
raise Exception(f"Error, scheme '{scheme}' from suite '{suite.sdf_name}' " | ||
f"not found in metadata files in {metapath}") | ||
|
||
run_env.logger.debug(f"reading metadata file {scheme_filename} for scheme {scheme}") | ||
|
||
new_metadata_headers = parse_metadata_file(scheme_filename, | ||
known_ddts=registered_fortran_ddt_names(), run_env=run_env) | ||
for scheme_metadata in new_metadata_headers: | ||
for section in scheme_metadata.sections(): | ||
found_var = [] | ||
intent = '' | ||
for scheme_var in section.variable_list(): | ||
exact_match = False | ||
if var == scheme_var.get_prop_value('standard_name'): | ||
run_env.logger.debug(f"Found variable {var} in scheme {section.title}") | ||
found_var = var | ||
exact_match = True | ||
intent = scheme_var.get_prop_value('intent') | ||
break | ||
scheme_var_standard_name = scheme_var.get_prop_value('standard_name') | ||
if scheme_var_standard_name.find(var) != -1: | ||
run_env.logger.debug(f"{var} matches {scheme_var_standard_name}") | ||
found_var.append(scheme_var_standard_name) | ||
if not found_var: | ||
run_env.logger.debug(f"Did not find variable {var} in scheme {section.title}") | ||
elif exact_match: | ||
run_env.logger.debug(f"Exact match found for variable {var} in scheme {section.title}," | ||
f" intent {intent}") | ||
var_graph.append((section.title,intent)) | ||
else: | ||
run_env.logger.debug(f"Found inexact matches for variable(s) {var} " | ||
f"in scheme {section.title}:\n{found_var}") | ||
partial_matches[section.title] = found_var | ||
if var_graph: | ||
success = True | ||
run_env.logger.debug(f"Successfully generated variable graph for sdf {suite.sdf_name}\n") | ||
else: | ||
success = False | ||
run_env.logger.error(f"Variable {var} not found in any suites for sdf {suite.sdf_name}\n") | ||
if partial_matches: | ||
print("Did find partial matches that may be of interest:\n") | ||
for key in partial_matches: | ||
print(f"In {key} found variable(s) {partial_matches[key]}") | ||
|
||
return (success,var_graph) | ||
|
||
def main(): | ||
"""Main routine that traverses a CCPP suite and outputs the list of schemes that use given variable""" | ||
|
||
args = parse_arguments() | ||
|
||
logger = setup_logging(args.debug) | ||
|
||
#Use new capgen class CCPPFrameworkEnv | ||
run_env = CCPPFrameworkEnv(logger, host_files="", scheme_files="", suites="") | ||
|
||
suite = parse_suite(args.sdf,run_env) | ||
|
||
(success, config) = import_config(args.config, None) | ||
if not success: | ||
raise Exception('Call to import_config failed.') | ||
|
||
# Variables defined by the host model; this call is necessary because it converts some old | ||
# metadata formats so they can be used later in the script | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I looked at |
||
(success, _, _) = gather_variable_definitions(config['variable_definition_files'], | ||
config['typedefs_new_metadata']) | ||
if not success: | ||
raise Exception('Call to gather_variable_definitions failed.') | ||
|
||
(success, var_graph) = create_var_graph(suite, args.variable, config, args.metadata_path, run_env) | ||
if success: | ||
print(f"For suite {suite.sdf_name}, the following schemes (in order) " | ||
f"use the variable {args.variable}:") | ||
for entry in var_graph: | ||
print(f"{entry[0]} (intent {entry[1]})") | ||
|
||
|
||
if __name__ == '__main__': | ||
main() |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Do you have examples of partial matches? How does tracking them help?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
This case is for when a user inputs something like "latent_heat" as their variable, which matches multiple standard names (e.g.
latent_heat_of_vaporization_of_water_at_0c
,surface_upward_potential_latent_heat_flux
, etc.). This makes it easier for users who might not know the exact standard name of the variable they are looking for, or for something like, for example, any variable containing the word "temperature".The final section in my PR message ("Partial match for variable") gives an example of this.