Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

test: cf checker #127

Merged
merged 13 commits into from
Sep 17, 2024
Binary file removed ARCO_smaller_area_subset_method_default.nc
Binary file not shown.
1 change: 1 addition & 0 deletions conda_environment_test.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@ dependencies:
- tox==4.11.4
- netcdf4==1.6.5
- syrupy==4.6.1
- compliance-checker==5.1.1
- pip:
- pytest-order==1.2.1
- freezegun==1.5.1
6 changes: 4 additions & 2 deletions copernicusmarine/download_functions/subset_xarray.py
Original file line number Diff line number Diff line change
Expand Up @@ -434,10 +434,12 @@ def _adequate_dtypes_of_valid_minmax(
dataset: xarray.Dataset, variable: str
) -> xarray.Dataset:
dataset[variable].attrs["valid_min"] = numpy.array(
[dataset[variable].attrs["valid_min"]], dtype=dataset[variable].dtype
[dataset[variable].attrs["valid_min"]],
dtype=dataset[variable].encoding["dtype"],
Comment on lines +437 to +438
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Nice! Maybe you should talk with Guille about this anyway, in case the valid min/max that comes from ARCO is different than the variable's normal value.

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Well, all of them have the same format (if int, int; if float, float), but the precision might be different... I'll ask anyway, yes!

)[0]
dataset[variable].attrs["valid_max"] = numpy.array(
[dataset[variable].attrs["valid_max"]], dtype=dataset[variable].dtype
[dataset[variable].attrs["valid_max"]],
dtype=dataset[variable].encoding["dtype"],
)[0]
return dataset

Expand Down
Empty file removed example.py
Empty file.
31 changes: 31 additions & 0 deletions tests/__snapshots__/test_cf_compliance.ambr
Original file line number Diff line number Diff line change
@@ -0,0 +1,31 @@
# serializer version: 1
# name: TestCFCompliance.test_subset_open
'cmems_mod_nws_bgc-pft_my_7km-3D-pico_P1M-m'
# ---
# name: TestCFCompliance.test_subset_open.1
160
# ---
# name: TestCFCompliance.test_subset_open.2
160
# ---
# name: TestCFCompliance.test_subset_open.3
list([
])
# ---
# name: TestCFCompliance.test_subset_with_warns
'cmems_obs-sst_med_phy-sst_nrt_diurnal-oi-0.0625deg_PT1H-m'
# ---
# name: TestCFCompliance.test_subset_with_warns.1
135
# ---
# name: TestCFCompliance.test_subset_with_warns.2
136
# ---
# name: TestCFCompliance.test_subset_with_warns.3
list([
'§2.6 Attributes',
list([
'§2.6.1 Conventions global attribute does not contain "CF-1.6"',
]),
])
# ---
76 changes: 76 additions & 0 deletions tests/test_cf_compliance.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,76 @@
import json

import xarray

from copernicusmarine import subset
from tests.test_utils import execute_in_terminal


class TestCFCompliance:
    """Snapshot tests running ``compliance-checker`` on subsetted files.

    Each test downloads a small subset of a dataset, runs the CF checker
    on the resulting NetCDF file and compares the score and the reported
    messages against the stored snapshot.
    """

    def test_subset_open(self, tmp_path, snapshot):
        """Subset the ``pico`` variable and snapshot its CF report."""
        dataset_id = "cmems_mod_nws_bgc-pft_my_7km-3D-pico_P1M-m"
        self.if_I_subset_a_dataset(dataset_id, tmp_path, "output_1.nc", "pico")
        self.then_it_is_cf_compliant(
            dataset_id, tmp_path, snapshot, "output_1"
        )

    def test_subset_with_warns(self, tmp_path, snapshot):
        """Subset the ``analysed_sst`` variable and snapshot its CF report."""
        dataset_id = (
            "cmems_obs-sst_med_phy-sst_nrt_diurnal-oi-0.0625deg_PT1H-m"
        )
        self.if_I_subset_a_dataset(
            dataset_id,
            tmp_path,
            "output_2.nc",
            "analysed_sst",
        )
        self.then_it_is_cf_compliant(
            dataset_id, tmp_path, snapshot, "output_2"
        )

    def if_I_subset_a_dataset(
        self, dataset_id, tmp_path, output_filename, variable
    ):
        """Download a fixed time window of one variable into ``tmp_path``.

        Args:
            dataset_id: Identifier of the dataset to subset.
            tmp_path: Directory that receives the output file.
            output_filename: Name of the NetCDF file to create
                (including the ``.nc`` extension).
            variable: Single variable to keep in the subset.
        """
        subset(
            dataset_id=dataset_id,
            variables=[variable],
            output_directory=tmp_path,
            output_filename=output_filename,
            start_datetime="2022-01-01T00:00:00",
            end_datetime="2022-01-05T00:00:00",
            force_download=True,
        )
        assert (tmp_path / output_filename).exists()

    def then_it_is_cf_compliant(
        self, dataset_id, tmp_path, snapshot, output_filename
    ):
        """Run the CF checker on a subset file and compare with the snapshot.

        Args:
            dataset_id: Identifier of the dataset; stored in the snapshot.
            tmp_path: Directory containing the subsetted file.
            snapshot: Snapshot fixture the results are compared against.
            output_filename: File name of the subset WITHOUT the ``.nc``
                extension.
        """
        netcdf_path = f"{tmp_path}/{output_filename}.nc"
        report_path = f"{tmp_path}/{output_filename}_checked.json"

        # Only the global attribute is needed: close the file right away so
        # no handle stays open while the external checker reads it.
        with xarray.open_dataset(netcdf_path) as dataset:
            cf_version = dataset.attrs["Conventions"][-3:]

        # Plain string comparison on the last three characters of the
        # attribute; anything sorting below "1.6" is checked against 1.6.
        # NOTE(review): 1.6 is presumably the oldest CF version the checker
        # supports -- confirm.
        if cf_version < "1.6":
            cf_version = "1.6"
        checker_key = f"cf:{cf_version}"

        command = [
            "compliance-checker",
            f"--test={checker_key}",
            netcdf_path,
            "-f",
            "json",
            "-o",
            report_path,
        ]
        execute_in_terminal(command)

        with open(report_path, encoding="utf-8") as report_file:
            report = json.load(report_file)[checker_key]

        # Flat list alternating check name and its messages, restricted to
        # the checks that actually reported something.
        list_msgs = []
        for check in report["all_priorities"]:
            if check["msgs"]:
                list_msgs.extend((check["name"], check["msgs"]))

        # The order of these assertions defines the snapshot indices.
        assert dataset_id == snapshot
        assert report["scored_points"] == snapshot
        assert report["possible_points"] == snapshot
        assert list_msgs == snapshot