From 2c492f88ad9cead81bd3be1c14f64d2eab59cf4f Mon Sep 17 00:00:00 2001 From: Bob Yantosca Date: Tue, 25 Jul 2023 10:31:07 -0400 Subject: [PATCH 1/7] Ensure closest grid box indices to stations are returned as integers benchmark/modules/benchmark_models_vs_obs.py - Convert longitudes and latitudes from xarray.DataArray to numpy.ndarray before computing x_idx and y_idx. This will ensure that x_idx and y_idx are returned as numpy.int64 values. NOTE: There is an issue with the search algorithm for GCHP data. We will rectify this soon. Signed-off-by: Bob Yantosca --- benchmark/modules/benchmark_models_vs_obs.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/benchmark/modules/benchmark_models_vs_obs.py b/benchmark/modules/benchmark_models_vs_obs.py index bd9149db..531069f2 100644 --- a/benchmark/modules/benchmark_models_vs_obs.py +++ b/benchmark/modules/benchmark_models_vs_obs.py @@ -348,20 +348,20 @@ def find_nearest_3d( Returns: -------- - x_idx, y_idx, z_idx + x_idx, y_idx, z_idx : numpy.int64 GEOS-Chem grid box indices for the single gridbox closest to GAW site specifications """ x_idx=( np.abs( - gc_data.lon - float(lon_value) + gc_data.lon.values - float(lon_value) ) ).argmin() y_idx=( np.abs( - gc_data.lat - float(lat_value) + gc_data.lat.values - float(lat_value) ) ).argmin() From 2a5451deb350b3383231912bd0459cbb6b9d04ab Mon Sep 17 00:00:00 2001 From: Bob Yantosca Date: Tue, 25 Jul 2023 10:32:59 -0400 Subject: [PATCH 2/7] Change models vs. obs. plots directory name to "ModelVsObs" benchmark/modules/run_1yr_fullchem_benchmark.py - gcc_vs_gcc_models_vs_obs_dir, gchp_vs_gcc_models_vs_obs_dir, and gchp_vs_gchp_models_vs_obs_dir now use directory name "ModelVsObs" instead of "Models_vs_Observations". Signed-off-by: Bob Yantosca --- benchmark/modules/run_1yr_fullchem_benchmark.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/benchmark/modules/run_1yr_fullchem_benchmark.py b/benchmark/modules/run_1yr_fullchem_benchmark.py index 8ab729e0..06d68eb2 100755 --- a/benchmark/modules/run_1yr_fullchem_benchmark.py +++ b/benchmark/modules/run_1yr_fullchem_benchmark.py @@ -229,13 +229,13 @@ def run_benchmark(config, bmk_year_ref, bmk_year_dev): # Models vs. observations directories gcc_vs_gcc_models_vs_obs_dir = os.path.join( - gcc_vs_gcc_resultsdir, "Models_vs_Observations" + gcc_vs_gcc_resultsdir, "ModelVsObs" ) gchp_vs_gcc_models_vs_obs_dir = os.path.join( - gchp_vs_gcc_resultsdir, "Models_vs_Observations" + gchp_vs_gcc_resultsdir, "ModelVsObs" ) gchp_vs_gchp_models_vs_obs_dir = os.path.join( - gchp_vs_gchp_resultsdir, "Models_vs_Observations" + gchp_vs_gchp_resultsdir, "ModelVsObs" ) # ====================================================================== From 6a7f52bd6f9716a5416aa33d9bb1b0f5cf6db64a Mon Sep 17 00:00:00 2001 From: Bob Yantosca Date: Thu, 27 Jul 2023 10:27:23 -0400 Subject: [PATCH 3/7] Add verify_variable_type function to util.py gcpy/util.py - Added utility function verify_variable_type. This will return a TypeError if a variable is not of the expected type or types that are provided. Useful for function argument error checking. Signed-off-by: Bob Yantosca --- gcpy/util.py | 31 +++++++++++++++++++++++++++++++ 1 file changed, 31 insertions(+) diff --git a/gcpy/util.py b/gcpy/util.py index 95265b32..cdb39747 100644 --- a/gcpy/util.py +++ b/gcpy/util.py @@ -2425,3 +2425,34 @@ def trim_cloud_benchmark_label( label.replace(v, "") return label + + +def verify_variable_type( + var, + var_type +): + """ + Convenience routine that will raise a TypeError if a variable's + type does not match a list of expected types. + + Args: + ----- + var : variable of any type + The variable to check. + + var_type : type or list of types + A single type definition (list, str, pandas.Series, etc.) + or a list of type definitions. + """ + + # var_type is a list of types + if isinstance(var_type, list): + for the_type in var_type: + if isinstance(var, the_type): + return + raise TypeError( f"{var} is not of type: {var_type}!") + + # var_type is a single type + if isinstance(var, var_type): + return + raise TypeError( f"{var} is not of type: {var_type}!") From f502064336730091867ced4415b0656857610840 Mon Sep 17 00:00:00 2001 From: Bob Yantosca Date: Thu, 27 Jul 2023 10:54:44 -0400 Subject: [PATCH 4/7] Pass tuples instead of lists to verify_variable_type gcpy/util.py - Function verify_variable_type now accepts a single type or a tuple of types. These are the allowable types to be passed to isinstance. gcpy/cstools.py - Convert lists of types to tuples in function calls to verify_variable_type - Also remove src_var argument in extract_grid function Signed-off-by: Bob Yantosca --- gcpy/cstools.py | 64 ++++++++++++++++++++++++++++++++++++++++--------- gcpy/util.py | 11 ++------- 2 files changed, 55 insertions(+), 20 deletions(-) diff --git a/gcpy/cstools.py b/gcpy/cstools.py index 0ef94124..8acced36 100644 --- a/gcpy/cstools.py +++ b/gcpy/cstools.py @@ -48,24 +48,28 @@ def extract_grid( - data, - src_var='Xdim' + data ): """ Extracts the grid information from an xarray.Dataset object and - returns a new xarray.Dataset object on a cubed-sphere grid. + returns the grid information as a cubed-sphere xarray.Dataset. Args: ----- - data : xarray.Dataset + data : xarray.Dataset or xarray.DataArray The input dataset - data_cs: xarray.Dataset + data_cs: xarray.Dataset or None Same data as in argument "ds", but on a cubed-sphere grid + If the data is not placed on a cubed-sphere grid, then + this will be returned with the value None. """ - if not isinstance(data, xr.Dataset): - return TypeError("Argument 'ds' is not of type 'xarray.Dataset'!") - n_cs = data[src_var].shape[-1] + gcpy.util.verify_variable_type(data, (xr.DataArray, xr.Dataset)) + + if not is_cubed_sphere(data): + return None + + n_cs = data["Xdim"].shape[-1] return gen_grid(n_cs) @@ -316,6 +320,7 @@ def gen_grid( stretched grid. Args: + ----- n_cs : int Number of grid boxes along a single face of the cubed-sphere. @@ -326,6 +331,16 @@ def gen_grid( Specifies the longitude and latitude at the center of the cubed-sphere grid face that will be stretched. Default values: None, None + + Returns: + -------- + grid : xarray.Dataset + Cubed-sphere grid definition containing the variables: + {'lat' : lat midpoints, + 'lon' : lon midpoints, + 'lat_b' : lat edges, + 'lon_b' : lon edges} + where each value has an extra face dimension of length 6. """ if stretch_factor is not None: cs_temp, ignore = gcpy.make_grid_SG( @@ -578,15 +593,14 @@ def find_index( Latitude and longitude (degrees) of the point for which cubed-sphere indices are desired. - grid : dict - Cubed-sphere grid definition as a dict of: + grid : xarray.Dataset + Cubed-sphere grid definition with the following variables: {'lat' : lat midpoints, 'lon' : lon midpoints, 'lat_b' : lat edges, 'lon_b' : lon edges} where each value has an extra face dimension of length 6. - Returns: -------- ind : numpy.ndarray @@ -595,6 +609,8 @@ def find_index( YDim is the cubed-sphere longitude index at (lat, lon) XDim is the cubed-sphere latitude index at (lat, lon) """ + gcpy.util.verify_variable_type(grid, xr.Dataset) + lon_vec = np.asarray(lon) lat_vec = np.asarray(lat) n_find = lon_vec.size @@ -638,3 +654,29 @@ def find_index( idx[:,i_find] = [nf_cs, ydim_cs, xdim_cs] return idx + + +def is_cubed_sphere( + data +): + """ + Given an xarray Dataset or DataArray object, determines if the + data is placed on a cubed-sphere grid + + Args: + ----- + data : xarray.Dataset or xarray.DataArray + The input data to be tested + + Returns: + -------- + is_gchp : bool + Returns True if data is placed on a cubed-sphere grid, + and False otherwise. + """ + gcpy.util.verify_variable_type(data, (xr.DataArray, xr.Dataset)) + + if "nf" in data.dims: # nf = number of cubed-sphere faces + return True + + return False diff --git a/gcpy/util.py b/gcpy/util.py index cdb39747..e4311d6b 100644 --- a/gcpy/util.py +++ b/gcpy/util.py @@ -2440,19 +2440,12 @@ def verify_variable_type( var : variable of any type The variable to check. - var_type : type or list of types + var_type : type or tuple of types A single type definition (list, str, pandas.Series, etc.) - or a list of type definitions. + or a tuple of type definitions. """ # var_type is a list of types - if isinstance(var_type, list): - for the_type in var_type: - if isinstance(var, the_type): - return - raise TypeError( f"{var} is not of type: {var_type}!") - - # var_type is a single type if isinstance(var, var_type): return raise TypeError( f"{var} is not of type: {var_type}!") From 31fc535eefbdd1a0afaf6182bb43ab9310db9782 Mon Sep 17 00:00:00 2001 From: Bob Yantosca Date: Thu, 27 Jul 2023 12:34:48 -0400 Subject: [PATCH 5/7] Use cstools functions in benchmark_models_vs_obs.py benchmark_models_vs_obs.py - Now use verify_variable_type to error check function arguments - Replaced find_nearest_3d function with separate functions for returning the model data nearest to the observation site for cubed-sphere and lat-lon grids - Updated PyDoc comments - For cubed-sphere grids, cap the lookup latitude at +/- 89.75 so that the a GCHP grid box can be found for a given (lon,lat) - Cap the y-axis range at 80 ppbv - Set y-axis tickmarks at 0, 20, 40, 60, 80 ppbv gcpy/cstools.py - Update PyDoc and comments with a better description of jitter_size Signed-off-by: Bob Yantosca --- benchmark/modules/benchmark_models_vs_obs.py | 354 +++++++++++++------ gcpy/cstools.py | 18 +- 2 files changed, 253 insertions(+), 119 deletions(-) diff --git a/benchmark/modules/benchmark_models_vs_obs.py b/benchmark/modules/benchmark_models_vs_obs.py index 531069f2..06b0b07a 100644 --- a/benchmark/modules/benchmark_models_vs_obs.py +++ b/benchmark/modules/benchmark_models_vs_obs.py @@ -22,7 +22,8 @@ import numpy as np import xarray as xr from gcpy.constants import skip_these_vars -from gcpy.util import dataset_reader, make_directory, reshape_MAPL_CS +from gcpy.util import verify_variable_type, dataset_reader, make_directory +from gcpy.cstools import extract_grid, find_index, is_cubed_sphere def read_nas( input_file, @@ -53,8 +54,7 @@ def read_nas( obs_site_coords : dict Dictionary containing formatted site name: lon, lat and altitude. """ - if not isinstance(input_file, str): - raise TypeError("Argument 'input_file' is not of type str!") + verify_variable_type(input_file, str) if verbose: print(f"read_nas: Reading {input_file}") @@ -160,8 +160,7 @@ def read_observational_data( obs_site_coords : dict Dictionary with coordinates of each observation site """ - if not isinstance(path, str): - raise TypeError("The 'path' argument is not of type str!") + verify_variable_type(path, str) first = True obs_site_coords = {} @@ -265,18 +264,11 @@ def read_model_data( raise exc(msg) from exc # Create a DataArray object and convert to ppbv (if necessary) - # Reshape GCHP data so that it has "lon", "lat" dimensions, - # which will facilitate data handling elsewhere in this module. with xr.set_options(keep_attrs=True): dataarray = dataset[varname] if "mol mol-1" in dataarray.attrs["units"]: dataarray.values *= 1.0e9 dataarray.attrs["units"] = "ppbv" - if "nf" in dataarray.dims: - dataarray = reshape_MAPL_CS( - dataarray, - multi_index_lat=False - ) return dataarray @@ -318,22 +310,97 @@ def find_times( return obs_dataframe, qcflag -def find_nearest_3d( +def get_nearest_model_data_to_obs_cs( gc_data, + gc_cs_grid, gc_level_alts_m, lon_value, lat_value, alt_value ): """ - Find GEOS-Chem gridbox closest to the observational dataset. - Uses lat, lon and alt from obs to select most appropriate GC data. + Returns GEOS-Chem model data (on a cubed-sphere grid) at the + grid box closest to an observation site location. + + Args: + ----- + gc_data : xarray DataArray + GEOS-Chem output to be processed + + gc_cs_grid: xarray Dataset + Coordinate arrays defining the cubed-sphere grid. + + gc_level_alts_m: pandas Series + Altitudes of GEOS-Chem levels in meters + + lon_value : float + GAW site longitude + + lat_value : float + GAW site latitude + + alt_value : float + GAW site altitude + + Keyword Args: + ------------- + + Returns: + -------- + dataframe: pandas.DataFrame + Model data closest to the observation site. + """ + verify_variable_type(gc_data, xr.DataArray) + verify_variable_type(gc_cs_grid, xr.Dataset) + verify_variable_type(gc_level_alts_m, pd.Series) + + # Prevent the latitude from getting too close to the N or S poles + lat_value = max(min(lat_value, 89.75), -89.75) + + # Indices (nf, yInd, xInd) of box nearest to observation site + cs_indices = find_index( + lat_value, + lon_value, + gc_cs_grid + ) + + # Index of nearest vertical levle to observation site + z_idx=( + np.abs( + gc_level_alts_m.values - float(alt_value) + ) + ).argmin() + + return gc_data.isel( + nf=cs_indices[0, 0], + Ydim=cs_indices[1, 0], + Xdim=cs_indices[2, 0], + lev=z_idx + ).to_dataframe() + + +def get_nearest_model_data_to_obs_ll( + gc_data, + gc_cs_grid, + gc_level_alts_m, + lon_value, + lat_value, + alt_value, + +): + """ + Returns GEOS-Chem model data (on a cubed-sphere grid) at the + grid box closest to an observation site location. Args: ----- gc_data : xarray DataSet GEOS-Chem output to be processed + gc_cs_grid : NoneType + Dummy variable (needed to make the argument list the + same as in get_nearest_model_data_to_obs_ll). + gc_level_alts_m: pandas Series Altitudes of GEOS-Chem levels in meters @@ -348,10 +415,12 @@ def find_nearest_3d( Returns: -------- - x_idx, y_idx, z_idx : numpy.int64 - GEOS-Chem grid box indices for the single gridbox - closest to GAW site specifications + dataframe: pandas.DataFrame + Model data closest to the observation site. """ + verify_variable_type(gc_data, xr.DataArray) + verify_variable_type(gc_cs_grid, type(None)) + verify_variable_type(gc_level_alts_m, pd.Series) x_idx=( np.abs( @@ -371,7 +440,39 @@ def find_nearest_3d( ) ).argmin() - return x_idx, y_idx, z_idx + return gc_data.isel( + lon=x_idx, + lat=y_idx, + lev=z_idx + ).to_dataframe() + + +def which_finder_function( + data +): + """ + Returns the function that will be used to get the model data nearest + to the observation site. The function that is returned depends on + whether the model grid is lat-lon or cubed-sphere, as different + handling needs to be applied to each grid + + Args: + ----- + data : xarray.DataArray + Model data + + Returns: + -------- + A reference to the function that will read the data, depending + on whether the data is placed on a cubed-sphere grid or on + a lat-lon grid. + """ + verify_variable_type(data, (xr.DataArray, xr.Dataset)) + + if is_cubed_sphere(data): + return get_nearest_model_data_to_obs_cs + + return get_nearest_model_data_to_obs_ll def get_geoschem_level_metadata( @@ -428,9 +529,12 @@ def prepare_data_for_plot( obs_site_coords, obs_site_name, ref_dataarray, + ref_cs_grid, dev_dataarray, + dev_cs_grid, gc_level_alts_m, - varname="SpeciesConcVV_O3" + varname="SpeciesConcVV_O3", + **kwargs, ): """ Prepares data for passing to routine plot_single_frames as follows: @@ -454,10 +558,12 @@ def prepare_data_for_plot( ref_dataarray, dev_dataarray : xarray DataArray Data from the Ref and Dev model versions. - ref_label, dev_label: str - Labels describing the Ref and Dev datasets (e.g. version numbers) + ref_cs_grid, dev_cs_grid : xarray.Dataset or NoneType + Dictionary containing the cubed-sphere grid definitions for + ref_dataarray and dev_dataarray (or None if ref_dataarray or + dev_dataarray are not placed on a cubed-sphere grid). - gc_level_alts_m : pandas DataFrame + gc_level_alts_m : pandas Series Metadata pertaining to GEOS-Chem vertical levels Keyword Args (Optional) @@ -481,34 +587,37 @@ def prepare_data_for_plot( subplot_ylabel : str Label for the Y-axis (e.g. species name). """ - - # Get Ref model data nearest to the observation site - x_idx, y_idx, z_idx = find_nearest_3d( + verify_variable_type(obs_dataframe, pd.DataFrame) + verify_variable_type(obs_site_coords, dict) + verify_variable_type(obs_site_name, str) + verify_variable_type(ref_dataarray, xr.DataArray) + verify_variable_type(dev_dataarray, xr.DataArray) + verify_variable_type(ref_cs_grid, (xr.Dataset, type(None))) + verify_variable_type(dev_cs_grid, (xr.Dataset, type(None))) + verify_variable_type(gc_level_alts_m, pd.Series) + verify_variable_type(varname, str) + + # Get data from the Ref model closest to the data site + finder_function = which_finder_function(ref_dataarray) + ref_dataframe = finder_function( ref_dataarray, + ref_cs_grid, gc_level_alts_m, lon_value=round(obs_site_coords[obs_site_name]['lon'], 2), lat_value=round(obs_site_coords[obs_site_name]['lat'], 2), alt_value=round(obs_site_coords[obs_site_name]['alt'], 1) ) - ref_dataframe = ref_dataarray.isel( - lon=x_idx, - lat=y_idx, - lev=z_idx - ).to_dataframe() - # Get Dev model data nearest to the observation site - x_idx, y_idx, z_idx = find_nearest_3d( + # Get data from the Dev model closest to the obs site + finder_function = which_finder_function(dev_dataarray) + dev_dataframe = finder_function( dev_dataarray, + dev_cs_grid, gc_level_alts_m, lon_value=round(obs_site_coords[obs_site_name]['lon'], 2), lat_value=round(obs_site_coords[obs_site_name]['lat'], 2), alt_value=round(obs_site_coords[obs_site_name]['alt'], 1) ) - dev_dataframe = dev_dataarray.isel( - lon=x_idx, - lat=y_idx, - lev=z_idx - ).to_dataframe() # Take the monthly mean of observations for plotting # (since some observation sites have multiple months of data) @@ -548,7 +657,8 @@ def plot_single_station( ref_series, ref_label, dev_series, - dev_label + dev_label, + **kwargs ): """ Plots observation data vs. model data at a single station site. @@ -582,21 +692,17 @@ def plot_single_station( Descriptive labels (e.g. version numbers) for the GEOS-Chem Ref and Dev model versions. """ - if not isinstance(fig, Figure): - msg = "The 'fig' argument is not of type matplotlib.figure.Figure!" - if not isinstance(cols_per_page, int): - msg = "The 'cols_per_page' argument is not of type int!" - if not isinstance(rows_per_page, int): - msg = "The 'rows_per_page' argument is not of type int!" - if not isinstance(obs_dataframe, pd.DataFrame): - msg = "The 'obs_dataframe' argument is not of type pandas.DataFrame!" - raise TypeError(msg) - if not isinstance(ref_series, pd.Series): - msg = "The 'ref_series' argument is not of type pandas.Series!" - raise TypeError(msg) - if not isinstance(dev_series, pd.Series): - msg = "The 'ref_series' argument is not of type pandas.Series!" - raise TypeError(msg) + verify_variable_type(fig, Figure) + verify_variable_type(rows_per_page, int) + verify_variable_type(cols_per_page, int) + verify_variable_type(subplot_index, int) + verify_variable_type(subplot_title, str) + verify_variable_type(subplot_ylabel, str) + verify_variable_type(obs_dataframe, pd.DataFrame) + verify_variable_type(ref_series, pd.Series) + verify_variable_type(ref_label, str) + verify_variable_type(dev_series, pd.Series) + verify_variable_type(dev_label, str) # Create matplotlib axes object for this subplot # axes_subplot is of type matplotlib.axes_.subplots.AxesSubplot @@ -664,10 +770,10 @@ def plot_single_station( ) axes_subplot.set_ylim( 0, - 100 + 80 ) axes_subplot.set_yticks( - [0, 25, 50, 75, 100] + [0, 20, 40, 60, 80] ) axes_subplot.tick_params( axis='both', @@ -683,12 +789,15 @@ def plot_one_page( obs_site_names, ref_dataarray, ref_label, + ref_cs_grid, dev_dataarray, dev_label, + dev_cs_grid, gc_level_alts_m, rows_per_page=3, cols_per_page=3, varname="SpeciesConcVV_O3", + **kwargs ): """ Plots a single page of models vs. observations. @@ -710,6 +819,11 @@ def plot_one_page( ref_label, dev_label: str Labels describing the Ref and Dev datasets (e.g. version numbers) + ref_cs_grid, dev_cs_grid : xarray.Dataset or NoneType + Dictionary containing the cubed-sphere grid definitions for + ref_dataarray and dev_dataarray (or None if ref_dataarray or + dev_dataarray are not placed on a cubed-sphere grid). + gc_level_alts_m : pandas DataFrame Metadata pertaining to GEOS-Chem vertical levels @@ -728,27 +842,16 @@ def plot_one_page( Toggles verbose printout on (True) or off (False). Default value: False """ - if not isinstance(obs_dataframe, pd.DataFrame): - msg = "The 'obs_dataframe' argument is not of type pandas.DataFrame!" - raise TypeError(msg) - if not isinstance(obs_site_coords, dict): - msg = "The 'obs_site_coords' argument is not of type dict!" - raise TypeError(msg) - if not isinstance(ref_dataarray, xr.DataArray): - msg = "The 'ref_dataset' argument is not of type xarray.DataArray!" - raise TypeError(msg) - if not isinstance(ref_label, str): - msg = "The 'ref_label' argument is not of type str!" - raise TypeError(msg) - if not isinstance(dev_dataarray, xr.DataArray): - msg = "The 'ref_dataset' argument is not of type xarray.DataArray!" - raise TypeError(msg) - if not isinstance(dev_label, str): - msg = "The 'dev_label' argument is not of type str!" - raise TypeError(msg) - if not isinstance(gc_level_alts_m, pd.Series): - msg = "The 'gc_level_alts_m' argument is not of type pandas.Series!" - raise TypeError(msg) + verify_variable_type(obs_dataframe, pd.DataFrame) + verify_variable_type(obs_site_coords, dict) + verify_variable_type(obs_site_names, list) + verify_variable_type(ref_dataarray, xr.DataArray) + verify_variable_type(ref_label, str) + verify_variable_type(ref_cs_grid, (xr.Dataset, type(None))) + verify_variable_type(dev_dataarray, xr.DataArray) + verify_variable_type(dev_label, str) + verify_variable_type(dev_cs_grid, (xr.Dataset, type(None))) + verify_variable_type(gc_level_alts_m, pd.Series) # Define a new matplotlib.figure.Figure object for this page # Landscape width: 11" x 8" @@ -768,9 +871,12 @@ def plot_one_page( obs_site_coords, # dict obs_site_name, # str ref_dataarray, # xarray.DataArray + ref_cs_grid, # dict or none dev_dataarray, # xarray.DataArray + dev_cs_grid, # dict or none gc_level_alts_m, # pandas.Series varname=varname, # str + **kwargs ) # Plot models vs. observation for a single station site @@ -786,7 +892,8 @@ def plot_one_page( ref_series, # pandas.Series ref_label, # str dev_series, # pandas.Series - dev_label # str + dev_label, # str + **kwargs ) # Add extra spacing around plots @@ -817,7 +924,7 @@ def plot_models_vs_obs( gc_level_alts_m, varname="SpeciesConcVV_O3", dst="./benchmark", - verbose=False + **kwargs ): """ Plots models vs. observations using a 3 rows x 3 column layout. @@ -853,24 +960,18 @@ def plot_models_vs_obs( Toggles verbose printout on (True) or off (False). Default value: False """ - if not isinstance(obs_dataframe, pd.DataFrame): - msg = "The 'obs_dataframe' argument is not of type pandas.DataFrame!" - raise TypeError(msg) - if not isinstance(ref_dataarray, xr.DataArray): - msg = "The 'ref_dataset' argument is not of type xarray.DataArray!" - raise TypeError(msg) - if not isinstance(ref_label, str): - msg = "The 'ref_label' argument is not of type str!" - raise TypeError(msg) - if not isinstance(dev_dataarray, xr.DataArray): - msg = "The 'ref_dataset' argument is not of type xarray.DataArray!" - raise TypeError(msg) - if not isinstance(dev_label, str): - msg = "The 'dev_label' argument is not of type str!" - raise TypeError(msg) - if not isinstance(gc_level_alts_m, pd.Series): - msg = "The 'gc_level_alts_m' argument is not of type pandas.Series!" - raise TypeError(msg) + verify_variable_type(obs_dataframe, pd.DataFrame) + verify_variable_type(obs_site_coords, dict) + verify_variable_type(ref_dataarray, xr.DataArray) + verify_variable_type(ref_label, str) + verify_variable_type(dev_dataarray, xr.DataArray) + verify_variable_type(dev_label, str) + verify_variable_type(gc_level_alts_m, pd.Series) + + # Get the cubed-sphere grid definitions for Ref & Dev + # (will be returned as "None" for lat/lon grids) + ref_cs_grid = extract_grid(ref_dataarray) + dev_cs_grid = extract_grid(dev_dataarray) # Figure setup plt.style.use('seaborn-darkgrid') @@ -906,12 +1007,15 @@ def plot_models_vs_obs( obs_site_names[start:end+1], # list of str ref_dataarray, # xarray.DataArray ref_label, # str + ref_cs_grid, # xarray.DataSet or NoneType dev_dataarray, # xarray.DataArray dev_label, # str + dev_cs_grid, # xarray.Dataset or NoneType gc_level_alts_m, # pandas.Series rows_per_page=rows_per_page, # int cols_per_page=cols_per_page, # int - varname=varname # str + varname=varname, # str + **kwargs ) # Close the PDF file after all pages are plotted. @@ -930,26 +1034,42 @@ def make_benchmark_models_vs_obs_plots( overwrite=False ): """ - Driver routine to create plots + Driver routine to create model vs. observation plots. + + Args: + ----- + obs_filepaths : str or list + Path(s) to the observational data. + + ref_filepaths, dev_filepaths: str or list + Path(s) to the Ref and Dev model versions to be compared. + + ref_label, dev_label : str + Descriptive labels (e.g. for version numbers) for the + Ref and Dev model data. + + Keyword Args (optional): + ------------------------ + varname : str + Variable name for model data to be plotted against + observations. Default value: "SpeciesConcVV_O3". + + dst : str + Path to the root folder where plots will be created. + + verbose : bool + Toggles verbose printout on (True) or off (False). + Default value: False + + overwrite : bool + Toggles whether plots should be overwritten (True) + or not (False). Default value: True """ - if not isinstance(obs_filepaths, list) and \ - not isinstance(obs_filepaths, str): - msg = "The 'obs_filepaths' argument is not of type 'list' or 'str'!" - raise TypeError(msg) - if not isinstance(ref_filepaths, list) and \ - not isinstance(ref_filepaths, str): - msg = "The 'ref_filepaths' argument is not of type 'list' or 'str'!" - raise TypeError(msg) - if not isinstance(ref_label, str): - msg = "The 'ref_label' argument is not of type 'str'!" - raise TypeError(msg) - if not isinstance(dev_filepaths, list) and \ - not isinstance(dev_filepaths, str): - msg = "The 'dev_filepaths' argument is not of type 'list' or 'str'!" - raise TypeError(msg) - if not isinstance(ref_label, str): - msg = "The 'dev_label' argument is not of type 'str'!" - raise TypeError(msg) + verify_variable_type(obs_filepaths, (str, list)) + verify_variable_type(ref_filepaths, (str, list)) + verify_variable_type(ref_label, str) + verify_variable_type(dev_filepaths, (str, list)) + verify_variable_type(dev_label, str) # Create the destination folder make_directory( diff --git a/gcpy/cstools.py b/gcpy/cstools.py index 8acced36..57be0619 100644 --- a/gcpy/cstools.py +++ b/gcpy/cstools.py @@ -495,7 +495,11 @@ def find_index_single( Ouptut of pyproj.Proj("+proj=latlon") jitter_size : float - ?? + If the point cannot be matched to a cubed-sphere grid box, + then shift longitude by the distance [m] specified in + jitter_size before doing the lookup once more. A nonzero + jitter_size value may be needed when the latitude is close + to +90 or -90. Returns: -------- @@ -546,9 +550,10 @@ def find_index_single( polygon.contains(xy_find_gno) for polygon in four_nearest_polygons_gno ] + # If the point cannot be matched (such as can happen near the poles), + # move the longitude by the jitter_size (in meters) and try again. if np.count_nonzero(polygon_contains_point) == 0: if jitter_size > 0.0: - # Move longitude by ~1 m nf_cs, ydim_cs, xdim_cs = find_index_single( y_find, x_find+jitter_size, @@ -601,6 +606,15 @@ def find_index( 'lon_b' : lon edges} where each value has an extra face dimension of length 6. + Keyword Args (optional): + ------------------------ + jitter_size : float + If the point cannot be matched to a cubed-sphere grid box, + then shift longitude by the distance [m] specified in + jitter_size before doing the lookup once more. A nonzero + jitter_size value may be needed when the latitude is close + to +90 or -90. Default value: 0 + Returns: -------- ind : numpy.ndarray From 525e8fdec6a886cc28d7bb87f8cc353c3357c689 Mon Sep 17 00:00:00 2001 From: Bob Yantosca Date: Thu, 27 Jul 2023 12:35:54 -0400 Subject: [PATCH 6/7] Minor updates in grid.py and util.py gcpy/grid.py - Remove inaccurate coment in verify_variable_type gcpy/util.py - Add "import numpy as np" instead of just importing individual numpy functions Signed-off-by: Bob Yantosca --- gcpy/grid.py | 9 ++++----- gcpy/util.py | 2 -- 2 files changed, 4 insertions(+), 7 deletions(-) diff --git a/gcpy/grid.py b/gcpy/grid.py index 3a8622d4..c4d8be5e 100644 --- a/gcpy/grid.py +++ b/gcpy/grid.py @@ -1,6 +1,5 @@ -import numpy as np import xarray as xr -from numpy import asarray +import numpy as np import scipy.sparse from itertools import product from .util import get_shape_of_data @@ -922,8 +921,8 @@ def calc_rectilinear_grid_area(lon_edge, lat_edge): # Convert from km to m _radius_earth_m = R_EARTH_m - lon_edge = asarray(lon_edge, dtype=float) - lat_edge = asarray(lat_edge, dtype=float) + lon_edge = np.asarray(lon_edge, dtype=float) + lat_edge = np.asarray(lat_edge, dtype=float) n_lon = (lon_edge.size) - 1 n_lat = (lat_edge.size) - 1 @@ -967,7 +966,7 @@ def calc_delta_lon(lon_edge): n_lon = (lon_edge.size) - 1 - lon_edge = asarray(lon_edge) + lon_edge = np.asarray(lon_edge) # Set up output array lon_delta = np.zeros((n_lon)) diff --git a/gcpy/util.py b/gcpy/util.py index e4311d6b..0cfcf91c 100644 --- a/gcpy/util.py +++ b/gcpy/util.py @@ -2444,8 +2444,6 @@ def verify_variable_type( A single type definition (list, str, pandas.Series, etc.) or a tuple of type definitions. """ - - # var_type is a list of types if isinstance(var, var_type): return raise TypeError( f"{var} is not of type: {var_type}!") From ef4304628389e6c9eabeefa9ef122e0e6754a1cc Mon Sep 17 00:00:00 2001 From: Bob Yantosca Date: Thu, 27 Jul 2023 13:09:59 -0400 Subject: [PATCH 7/7] Updated CHANGELOG.md for latest models vs. obs new features CHANGELOG.md - Added blurb about new verify_variable_type function - Minor edits to fix typos Signed-off-by: Bob Yantosca --- CHANGELOG.md | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 3b907240..fbec1a3e 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -20,8 +20,9 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/), - Added `benchmark/modules/GC_72_vertical_levels.csv` file - Added `multi_index_lat` keyword to `reshape_MAPL_CS` function in `gcpy/util.py` - Added FURA to `emission_species.yml` and `benchmark_categories.yml` -- Added new routine `format_number_for_table` in `util.py` +- Added new routine `format_number_for_table` in `gcpy/util.py` - Added module `gcpy/cstools.py` with utility functions for cubed-sphere grids +- Added new routine `verify_variable_type` function in `gcpy/util.py` ### Changed - Simplified the Github issues templates into two options: `new-feature-or-discussion.md` and `question-issue.md` @@ -41,7 +42,7 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/), ### Fixed - Generalized test for GCHP or GCClassic restart file in `regrid_restart_file.py` - Fixed bug in transport tracer benchmark mass conservation table file write -- Routine `create_display _name` now splits on only the first `_` in species & diag names +- Routine `create_display_name` now splits on only the first `_` in species & diag names ### Removed - Removed `gchp_is_pre_13_1` arguments & code from benchmarking routines