From 689b0ca4cdb969fcd27c779e0e86f5f12bf9401b Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Wed, 6 Sep 2023 15:49:02 +0200 Subject: [PATCH 01/33] [skip-ci] --- docs/whats-new.rst | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/docs/whats-new.rst b/docs/whats-new.rst index 228b8c25..97b13938 100644 --- a/docs/whats-new.rst +++ b/docs/whats-new.rst @@ -8,6 +8,13 @@ What's New |pypi dwn| |conda dwn| +Coming up next +-------------- + +**Internals** + +- Utilities refactoring. Each class/function have been refactored in more appropriate locations like ``argopy.utils`` or ``argopy.relatec``. + v0.1.14rc2 (27 Jul. 2023) ------------------------- From 3e490333a2da5138f66f5d9daed1f3fd0b67942d Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Wed, 6 Sep 2023 15:56:28 +0200 Subject: [PATCH 02/33] Move TopoFetcher to argopy.related --- argopy/__init__.py | 3 +- argopy/related/__init__.py | 7 ++ argopy/related/topo.py | 203 +++++++++++++++++++++++++++++++++++++ argopy/utilities.py | 200 ------------------------------------ 4 files changed, 212 insertions(+), 201 deletions(-) create mode 100644 argopy/related/__init__.py create mode 100644 argopy/related/topo.py diff --git a/argopy/__init__.py b/argopy/__init__.py index e0020728..7a90d217 100644 --- a/argopy/__init__.py +++ b/argopy/__init__.py @@ -35,12 +35,13 @@ from . import plot # noqa: E402 from .plot import dashboard, ArgoColors # noqa: E402 from .utilities import show_versions, show_options, clear_cache, lscache # noqa: E402 -from .utilities import TopoFetcher, ArgoNVSReferenceTables, OceanOPSDeployments, ArgoDocs # noqa: E402 +from .utilities import ArgoNVSReferenceTables, OceanOPSDeployments, ArgoDocs # noqa: E402 from .utilities import monitor_status as status # noqa: E402 from .options import set_options, reset_options # noqa: E402 from .data_fetchers import CTDRefDataFetcher # noqa: E402 from .stores import ArgoIndex # noqa: E402 from .utils import compute # noqa: E402, F401 +from .related import TopoFetcher # noqa: E402 # __all__ = ( diff --git a/argopy/related/__init__.py b/argopy/related/__init__.py new file mode 100644 index 00000000..58c3812e --- /dev/null +++ b/argopy/related/__init__.py @@ -0,0 +1,7 @@ +from .topo import TopoFetcher + +# +__all__ = ( + # Classes: + "TopoFetcher", +) \ No newline at end of file diff --git a/argopy/related/topo.py b/argopy/related/topo.py new file mode 100644 index 00000000..39b7f4b1 --- /dev/null +++ b/argopy/related/topo.py @@ -0,0 +1,203 @@ +from typing import Union +from ..options import OPTIONS +from ..stores import httpstore +from ..utilities import format_oneline + + +class TopoFetcher: + """ Fetch topographic data through an ERDDAP server for an ocean rectangle + + Example: + >>> from argopy import TopoFetcher + >>> box = [-75, -45, 20, 30] # Lon_min, lon_max, lat_min, lat_max + >>> ds = TopoFetcher(box).to_xarray() + >>> ds = TopoFetcher(box, ds='gebco', stride=[10, 10], cache=True).to_xarray() + + """ + + class ERDDAP: + def __init__(self, server: str, protocol: str = "tabledap"): + self.server = server + self.protocol = protocol + self.response = "nc" + self.dataset_id = "" + self.constraints = "" + + def __init__( + self, + box: list, + ds: str = "gebco", + cache: bool = False, + cachedir: str = "", + api_timeout: int = 0, + stride: list = [1, 1], + server: Union[str] = None, + **kwargs, + ): + """ Instantiate an ERDDAP topo data fetcher + + Parameters + ---------- + ds: str (optional), default: 'gebco' + Dataset to load: + + - 'gebco' will load the GEBCO_2020 Grid, a 
continuous terrain model for oceans and land at 15 arc-second intervals + stride: list, default [1, 1] + Strides along longitude and latitude. This allows to change the output resolution + cache: bool (optional) + Cache data or not (default: False) + cachedir: str (optional) + Path to cache folder + api_timeout: int (optional) + Erddap request time out in seconds. Set to OPTIONS['api_timeout'] by default. + """ + timeout = OPTIONS["api_timeout"] if api_timeout == 0 else api_timeout + self.fs = httpstore( + cache=cache, cachedir=cachedir, timeout=timeout, size_policy="head" + ) + self.definition = "Erddap topographic data fetcher" + + self.BOX = box + self.stride = stride + if ds == "gebco": + self.definition = "NOAA erddap gebco data fetcher for a space region" + self.server = server if server is not None else "https://coastwatch.pfeg.noaa.gov/erddap" + self.server_name = "NOAA" + self.dataset_id = "gebco" + + self._init_erddap() + + def _init_erddap(self): + # Init erddap + self.erddap = self.ERDDAP(server=self.server, protocol="griddap") + self.erddap.response = "nc" + + if self.dataset_id == "gebco": + self.erddap.dataset_id = "GEBCO_2020" + else: + raise ValueError( + "Invalid database short name for %s erddap" % self.server_name + ) + return self + + def _cname(self) -> str: + """ Fetcher one line string definition helper """ + cname = "?" + + if hasattr(self, "BOX"): + BOX = self.BOX + cname = ("[x=%0.2f/%0.2f; y=%0.2f/%0.2f]") % ( + BOX[0], + BOX[1], + BOX[2], + BOX[3], + ) + return cname + + def __repr__(self): + summary = [""] + summary.append("Name: %s" % self.definition) + summary.append("API: %s" % self.server) + summary.append("Domain: %s" % format_oneline(self.cname())) + return "\n".join(summary) + + def cname(self): + """ Return a unique string defining the constraints """ + return self._cname() + + @property + def cachepath(self): + """ Return path to cached file(s) for this request + + Returns + ------- + list(str) + """ + return [self.fs.cachepath(uri) for uri in self.uri] + + def define_constraints(self): + """ Define request constraints """ + # Eg: https://coastwatch.pfeg.noaa.gov/erddap/griddap/GEBCO_2020.nc?elevation%5B(34):5:(42)%5D%5B(-21):7:(-12)%5D + self.erddap.constraints = "%s(%0.2f):%i:(%0.2f)%s%s(%0.2f):%i:(%0.2f)%s" % ( + "%5B", + self.BOX[2], + self.stride[1], + self.BOX[3], + "%5D", + "%5B", + self.BOX[0], + self.stride[0], + self.BOX[1], + "%5D", + ) + return None + + # @property + # def _minimal_vlist(self): + # """ Return the minimal list of variables to retrieve """ + # vlist = list() + # vlist.append("latitude") + # vlist.append("longitude") + # vlist.append("elevation") + # return vlist + + def url_encode(self, url): + """ Return safely encoded list of urls + + This is necessary because fsspec cannot handle in cache paths/urls with a '[' character + """ + + # return urls + def safe_for_fsspec_cache(url): + url = url.replace("[", "%5B") # This is the one really necessary + url = url.replace("]", "%5D") # For consistency + return url + + return safe_for_fsspec_cache(url) + + def get_url(self): + """ Return the URL to download data requested + + Returns + ------- + str + """ + # First part of the URL: + protocol = self.erddap.protocol + dataset_id = self.erddap.dataset_id + response = self.erddap.response + url = f"{self.erddap.server}/{protocol}/{dataset_id}.{response}?" 
+ + # Add variables to retrieve: + variables = ["elevation"] + variables = ",".join(variables) + url += f"{variables}" + + # Add constraints: + self.define_constraints() # Define constraint to select this box of data (affect self.erddap.constraints) + url += f"{self.erddap.constraints}" + + return self.url_encode(url) + + @property + def uri(self): + """ List of files to load for a request + + Returns + ------- + list(str) + """ + return [self.get_url()] + + def to_xarray(self, errors: str = "ignore"): + """ Load Topographic data and return a xarray.DataSet """ + + # Download data + if len(self.uri) == 1: + ds = self.fs.open_dataset(self.uri[0]) + + return ds + + def load(self, errors: str = "ignore"): + """ Load Topographic data and return a xarray.DataSet """ + return self.to_xarray(errors=errors) diff --git a/argopy/utilities.py b/argopy/utilities.py index 777a8dab..9ff569f9 100644 --- a/argopy/utilities.py +++ b/argopy/utilities.py @@ -2042,206 +2042,6 @@ def _subsample_bins(x, y, target_values): return remapped -class TopoFetcher: - """ Fetch topographic data through an ERDDAP server for an ocean rectangle - - Example: - >>> from argopy import TopoFetcher - >>> box = [-75, -45, 20, 30] # Lon_min, lon_max, lat_min, lat_max - >>> ds = TopoFetcher(box).to_xarray() - >>> ds = TopoFetcher(box, ds='gebco', stride=[10, 10], cache=True).to_xarray() - - """ - - class ERDDAP: - def __init__(self, server: str, protocol: str = "tabledap"): - self.server = server - self.protocol = protocol - self.response = "nc" - self.dataset_id = "" - self.constraints = "" - - def __init__( - self, - box: list, - ds: str = "gebco", - cache: bool = False, - cachedir: str = "", - api_timeout: int = 0, - stride: list = [1, 1], - server: Union[str] = None, - **kwargs, - ): - """ Instantiate an ERDDAP topo data fetcher - - Parameters - ---------- - ds: str (optional), default: 'gebco' - Dataset to load: - - - 'gebco' will load the GEBCO_2020 Grid, a continuous terrain model for oceans and land at 15 arc-second intervals - stride: list, default [1, 1] - Strides along longitude and latitude. This allows to change the output resolution - cache: bool (optional) - Cache data or not (default: False) - cachedir: str (optional) - Path to cache folder - api_timeout: int (optional) - Erddap request time out in seconds. Set to OPTIONS['api_timeout'] by default. - """ - from .stores import httpstore - timeout = OPTIONS["api_timeout"] if api_timeout == 0 else api_timeout - self.fs = httpstore( - cache=cache, cachedir=cachedir, timeout=timeout, size_policy="head" - ) - self.definition = "Erddap topographic data fetcher" - - self.BOX = box - self.stride = stride - if ds == "gebco": - self.definition = "NOAA erddap gebco data fetcher for a space region" - self.server = server if server is not None else "https://coastwatch.pfeg.noaa.gov/erddap" - self.server_name = "NOAA" - self.dataset_id = "gebco" - - self._init_erddap() - - def _init_erddap(self): - # Init erddap - self.erddap = self.ERDDAP(server=self.server, protocol="griddap") - self.erddap.response = "nc" - - if self.dataset_id == "gebco": - self.erddap.dataset_id = "GEBCO_2020" - else: - raise ValueError( - "Invalid database short name for %s erddap" % self.server_name - ) - return self - - def _cname(self) -> str: - """ Fetcher one line string definition helper """ - cname = "?" 
- - if hasattr(self, "BOX"): - BOX = self.BOX - cname = ("[x=%0.2f/%0.2f; y=%0.2f/%0.2f]") % ( - BOX[0], - BOX[1], - BOX[2], - BOX[3], - ) - return cname - - def __repr__(self): - summary = [""] - summary.append("Name: %s" % self.definition) - summary.append("API: %s" % self.server) - summary.append("Domain: %s" % format_oneline(self.cname())) - return "\n".join(summary) - - def cname(self): - """ Return a unique string defining the constraints """ - return self._cname() - - @property - def cachepath(self): - """ Return path to cached file(s) for this request - - Returns - ------- - list(str) - """ - return [self.fs.cachepath(uri) for uri in self.uri] - - def define_constraints(self): - """ Define request constraints """ - # Eg: https://coastwatch.pfeg.noaa.gov/erddap/griddap/GEBCO_2020.nc?elevation%5B(34):5:(42)%5D%5B(-21):7:(-12)%5D - self.erddap.constraints = "%s(%0.2f):%i:(%0.2f)%s%s(%0.2f):%i:(%0.2f)%s" % ( - "%5B", - self.BOX[2], - self.stride[1], - self.BOX[3], - "%5D", - "%5B", - self.BOX[0], - self.stride[0], - self.BOX[1], - "%5D", - ) - return None - - # @property - # def _minimal_vlist(self): - # """ Return the minimal list of variables to retrieve """ - # vlist = list() - # vlist.append("latitude") - # vlist.append("longitude") - # vlist.append("elevation") - # return vlist - - def url_encode(self, url): - """ Return safely encoded list of urls - - This is necessary because fsspec cannot handle in cache paths/urls with a '[' character - """ - - # return urls - def safe_for_fsspec_cache(url): - url = url.replace("[", "%5B") # This is the one really necessary - url = url.replace("]", "%5D") # For consistency - return url - - return safe_for_fsspec_cache(url) - - def get_url(self): - """ Return the URL to download data requested - - Returns - ------- - str - """ - # First part of the URL: - protocol = self.erddap.protocol - dataset_id = self.erddap.dataset_id - response = self.erddap.response - url = f"{self.erddap.server}/{protocol}/{dataset_id}.{response}?" 
- - # Add variables to retrieve: - variables = ["elevation"] - variables = ",".join(variables) - url += f"{variables}" - - # Add constraints: - self.define_constraints() # Define constraint to select this box of data (affect self.erddap.constraints) - url += f"{self.erddap.constraints}" - - return self.url_encode(url) - - @property - def uri(self): - """ List of files to load for a request - - Returns - ------- - list(str) - """ - return [self.get_url()] - - def to_xarray(self, errors: str = "ignore"): - """ Load Topographic data and return a xarray.DataSet """ - - # Download data - if len(self.uri) == 1: - ds = self.fs.open_dataset(self.uri[0]) - - return ds - - def load(self, errors: str = "ignore"): - """ Load Topographic data and return a xarray.DataSet """ - return self.to_xarray(errors=errors) - - def argo_split_path(this_path): # noqa C901 """ Split path from a GDAC ftp style Argo netcdf file and return information From beae1af4c5e63e5e8c22a91088d9573059ca67eb Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Wed, 6 Sep 2023 16:04:33 +0200 Subject: [PATCH 03/33] [skip-ci] --- argopy/__init__.py | 4 +- argopy/related/__init__.py | 4 +- argopy/related/ocean_ops_deployments.py | 377 ++++++++++++++++++++++ argopy/related/{topo.py => topography.py} | 0 argopy/utilities.py | 372 --------------------- 5 files changed, 382 insertions(+), 375 deletions(-) create mode 100644 argopy/related/ocean_ops_deployments.py rename argopy/related/{topo.py => topography.py} (100%) diff --git a/argopy/__init__.py b/argopy/__init__.py index 7a90d217..8c8f6cf7 100644 --- a/argopy/__init__.py +++ b/argopy/__init__.py @@ -35,13 +35,13 @@ from . import plot # noqa: E402 from .plot import dashboard, ArgoColors # noqa: E402 from .utilities import show_versions, show_options, clear_cache, lscache # noqa: E402 -from .utilities import ArgoNVSReferenceTables, OceanOPSDeployments, ArgoDocs # noqa: E402 +from .utilities import ArgoNVSReferenceTables, ArgoDocs # noqa: E402 from .utilities import monitor_status as status # noqa: E402 from .options import set_options, reset_options # noqa: E402 from .data_fetchers import CTDRefDataFetcher # noqa: E402 from .stores import ArgoIndex # noqa: E402 from .utils import compute # noqa: E402, F401 -from .related import TopoFetcher # noqa: E402 +from .related import TopoFetcher, OceanOPSDeployments # noqa: E402 # __all__ = ( diff --git a/argopy/related/__init__.py b/argopy/related/__init__.py index 58c3812e..f2c85631 100644 --- a/argopy/related/__init__.py +++ b/argopy/related/__init__.py @@ -1,7 +1,9 @@ -from .topo import TopoFetcher +from .topography import TopoFetcher +from .ocean_ops_deployments import OceanOPSDeployments # __all__ = ( # Classes: "TopoFetcher", + "OceanOPSDeployments", ) \ No newline at end of file diff --git a/argopy/related/ocean_ops_deployments.py b/argopy/related/ocean_ops_deployments.py new file mode 100644 index 00000000..a1a2dea6 --- /dev/null +++ b/argopy/related/ocean_ops_deployments.py @@ -0,0 +1,377 @@ +import pandas as pd +import numpy as np +from ..stores import httpstore +from ..errors import DataNotFound +from ..plot import scatter_map + + +class OceanOPSDeployments: + """Use the OceanOPS API for metadata access to retrieve Argo floats deployment information. 
+ + The API is documented here: https://www.ocean-ops.org/api/swagger/?url=https://www.ocean-ops.org/api/1/oceanops-api.yaml + + Description of deployment status name: + + =========== == ==== + Status Id Description + =========== == ==== + PROBABLE 0 Starting status for some platforms, when there is only a few metadata available, like rough deployment location and date. The platform may be deployed + CONFIRMED 1 Automatically set when a ship is attached to the deployment information. The platform is ready to be deployed, deployment is planned + REGISTERED 2 Starting status for most of the networks, when deployment planning is not done. The deployment is certain, and a notification has been sent via the OceanOPS system + OPERATIONAL 6 Automatically set when the platform is emitting a pulse and observations are distributed within a certain time interval + INACTIVE 4 The platform is not emitting a pulse since a certain time + CLOSED 5 The platform is not emitting a pulse since a long time, it is considered as dead + =========== == ==== + + Examples + -------- + + Import the class: + + >>> from argopy.related import OceanOPSDeployments + >>> from argopy import OceanOPSDeployments + + Possibly define the space/time box to work with: + + >>> box = [-20, 0, 42, 51] + >>> box = [-20, 0, 42, 51, '2020-01', '2021-01'] + >>> box = [-180, 180, -90, 90, '2020-01', None] + + Instantiate the metadata fetcher: + + >>> deployment = OceanOPSDeployments() + >>> deployment = OceanOPSDeployments(box) + >>> deployment = OceanOPSDeployments(box, deployed_only=True) # Remove planification + + Load information: + + >>> df = deployment.to_dataframe() + >>> data = deployment.to_json() + + Useful attributes and methods: + + >>> deployment.uri + >>> deployment.uri_decoded + >>> deployment.status_code + >>> fig, ax = deployment.plot_status() + >>> plan_virtualfleet = deployment.plan + + """ + api = "https://www.ocean-ops.org" + """URL to the API""" + + model = "api/1/data/platform" + """This model represents a Platform entity and is used to retrieve a platform information (schema model + named 'Ptf').""" + + api_server_check = 'https://www.ocean-ops.org/api/1/oceanops-api.yaml' + """URL to check if the API is alive""" + + def __init__(self, box: list = None, deployed_only: bool = False): + """ + + Parameters + ---------- + box: list, optional, default=None + Define the domain to load the Argo deployment plan for. By default, **box** is set to None to work with the + global deployment plan starting from the current date. + The list expects one of the following format: + + - [lon_min, lon_max, lat_min, lat_max] + - [lon_min, lon_max, lat_min, lat_max, date_min] + - [lon_min, lon_max, lat_min, lat_max, date_min, date_max] + + Longitude and latitude values must be floats. Dates are strings. + If **box** is provided with a regional domain definition (only 4 values given), then ``date_min`` will be + set to the current date. + + deployed_only: bool, optional, default=False + Return only floats already deployed. If set to False (default), will return the full + deployment plan (floats with all possible status). If set to True, will return only floats with one of the + following status: ``OPERATIONAL``, ``INACTIVE``, and ``CLOSED``. 
+ """ + if box is None: + box = [None, None, None, None, pd.to_datetime('now', utc=True).strftime("%Y-%m-%d"), None] + elif len(box) == 4: + box.append(pd.to_datetime('now', utc=True).strftime("%Y-%m-%d")) + box.append(None) + elif len(box) == 5: + box.append(None) + + if len(box) != 6: + raise ValueError("The 'box' argument must be: None or of lengths 4 or 5 or 6\n%s" % str(box)) + + self.box = box + self.deployed_only = deployed_only + self.data = None + + self.fs = httpstore(cache=False) + + def __format(self, x, typ: str) -> str: + """ string formatting helper """ + if typ == "lon": + return str(x) if x is not None else "-" + elif typ == "lat": + return str(x) if x is not None else "-" + elif typ == "tim": + return pd.to_datetime(x).strftime("%Y-%m-%d") if x is not None else "-" + else: + return str(x) + + def __repr__(self): + summary = [""] + summary.append("API: %s/%s" % (self.api, self.model)) + summary.append("Domain: %s" % self.box_name) + summary.append("Deployed only: %s" % self.deployed_only) + if self.data is not None: + summary.append("Nb of floats in the deployment plan: %s" % self.size) + else: + summary.append("Nb of floats in the deployment plan: - [Data not retrieved yet]") + return '\n'.join(summary) + + def __encode_inc(self, inc): + """Return encoded uri expression for 'include' parameter + + Parameters + ---------- + inc: str + + Returns + ------- + str + """ + return inc.replace("\"", "%22").replace("[", "%5B").replace("]", "%5D") + + def __encode_exp(self, exp): + """Return encoded uri expression for 'exp' parameter + + Parameters + ---------- + exp: str + + Returns + ------- + str + """ + return exp.replace("\"", "%22").replace("'", "%27").replace(" ", "%20").replace(">", "%3E").replace("<", "%3C") + + def __get_uri(self, encoded=False): + uri = "exp=%s&include=%s" % (self.exp(encoded=encoded), self.include(encoded=encoded)) + url = "%s/%s?%s" % (self.api, self.model, uri) + return url + + def include(self, encoded=False): + """Return an Ocean-Ops API 'include' expression + + This is used to determine which variables the API call should return + + Parameters + ---------- + encoded: bool, default=False + + Returns + ------- + str + """ + # inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus", "wmos"] + # inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus.id", "ptfStatus.name", "wmos"] + # inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus.id", "ptfStatus.name"] + inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus.id", "ptfStatus.name", + "ptfStatus.description", + "program.nameShort", "program.country.nameShort", "ptfModel.nameShort", "ptfDepl.noSite"] + inc = "[%s]" % ",".join(["\"%s\"" % v for v in inc]) + return inc if not encoded else self.__encode_inc(inc) + + def exp(self, encoded=False): + """Return an Ocean-Ops API deployment search expression for an argopy region box definition + + Parameters + ---------- + encoded: bool, default=False + + Returns + ------- + str + """ + exp, arg = "networkPtfs.network.name='Argo'", [] + if self.box[0] is not None: + exp += " and ptfDepl.lon>=$var%i" % (len(arg) + 1) + arg.append(str(self.box[0])) + if self.box[1] is not None: + exp += " and ptfDepl.lon<=$var%i" % (len(arg) + 1) + arg.append(str(self.box[1])) + if self.box[2] is not None: + exp += " and ptfDepl.lat>=$var%i" % (len(arg) + 1) + arg.append(str(self.box[2])) + if self.box[3] is not None: + exp += " and ptfDepl.lat<=$var%i" % (len(arg) + 1) + 
arg.append(str(self.box[3])) + if len(self.box) > 4: + if self.box[4] is not None: + exp += " and ptfDepl.deplDate>=$var%i" % (len(arg) + 1) + arg.append("\"%s\"" % pd.to_datetime(self.box[4]).strftime("%Y-%m-%d %H:%M:%S")) + if self.box[5] is not None: + exp += " and ptfDepl.deplDate<=$var%i" % (len(arg) + 1) + arg.append("\"%s\"" % pd.to_datetime(self.box[5]).strftime("%Y-%m-%d %H:%M:%S")) + + if self.deployed_only: + exp += " and ptfStatus>=$var%i" % (len(arg) + 1) + arg.append(str(4)) # Allow for: 4, 5 or 6 + + exp = "[\"%s\", %s]" % (exp, ", ".join(arg)) + return exp if not encoded else self.__encode_exp(exp) + + @property + def size(self): + return len(self.data['data']) if self.data is not None else None + + @property + def status_code(self): + """Return a :class:`pandas.DataFrame` with the definition of status""" + status = {'status_code': [0, 1, 2, 6, 4, 5], + 'status_name': ['PROBABLE', 'CONFIRMED', 'REGISTERED', 'OPERATIONAL', 'INACTIVE', 'CLOSED'], + 'description': [ + 'Starting status for some platforms, when there is only a few metadata available, like rough deployment location and date. The platform may be deployed', + 'Automatically set when a ship is attached to the deployment information. The platform is ready to be deployed, deployment is planned', + 'Starting status for most of the networks, when deployment planning is not done. The deployment is certain, and a notification has been sent via the OceanOPS system', + 'Automatically set when the platform is emitting a pulse and observations are distributed within a certain time interval', + 'The platform is not emitting a pulse since a certain time', + 'The platform is not emitting a pulse since a long time, it is considered as dead', + ], + } + return pd.DataFrame(status).set_index('status_code') + + @property + def box_name(self): + """Return a string to print the box property""" + BOX = self.box + cname = ("[lon=%s/%s; lat=%s/%s]") % ( + self.__format(BOX[0], "lon"), + self.__format(BOX[1], "lon"), + self.__format(BOX[2], "lat"), + self.__format(BOX[3], "lat"), + ) + if len(BOX) == 6: + cname = ("[lon=%s/%s; lat=%s/%s; t=%s/%s]") % ( + self.__format(BOX[0], "lon"), + self.__format(BOX[1], "lon"), + self.__format(BOX[2], "lat"), + self.__format(BOX[3], "lat"), + self.__format(BOX[4], "tim"), + self.__format(BOX[5], "tim"), + ) + return cname + + @property + def uri(self): + """Return encoded URL to post an Ocean-Ops API request + + Returns + ------- + str + """ + return self.__get_uri(encoded=True) + + @property + def uri_decoded(self): + """Return decoded URL to post an Ocean-Ops API request + + Returns + ------- + str + """ + return self.__get_uri(encoded=False) + + @property + def plan(self): + """Return a dictionary to be used as argument in a :class:`virtualargofleet.VirtualFleet` + + This method is for dev, but will be moved to the VirtualFleet software utilities + """ + df = self.to_dataframe() + plan = df[['lon', 'lat', 'date']].rename(columns={"date": "time"}).to_dict('series') + for key in plan.keys(): + plan[key] = plan[key].to_list() + plan['time'] = np.array(plan['time'], dtype='datetime64') + return plan + + def to_json(self): + """Return OceanOPS API request response as a json object""" + if self.data is None: + self.data = self.fs.open_json(self.uri) + return self.data + + def to_dataframe(self): + """Return the deployment plan as :class:`pandas.DataFrame` + + Returns + ------- + :class:`pandas.DataFrame` + """ + data = self.to_json() + if data['total'] == 0: + raise DataNotFound('Your search matches no 
results') + + # res = {'date': [], 'lat': [], 'lon': [], 'wmo': [], 'status_name': [], 'status_code': []} + # res = {'date': [], 'lat': [], 'lon': [], 'wmo': [], 'status_name': [], 'status_code': [], 'ship_name': []} + res = {'date': [], 'lat': [], 'lon': [], 'wmo': [], 'status_name': [], 'status_code': [], 'program': [], + 'country': [], 'model': []} + # status = {'REGISTERED': None, 'OPERATIONAL': None, 'INACTIVE': None, 'CLOSED': None, + # 'CONFIRMED': None, 'OPERATIONAL': None, 'PROBABLE': None, 'REGISTERED': None} + + for irow, ptf in enumerate(data['data']): + # if irow == 0: + # print(ptf) + res['lat'].append(ptf['ptfDepl']['lat']) + res['lon'].append(ptf['ptfDepl']['lon']) + res['date'].append(ptf['ptfDepl']['deplDate']) + res['wmo'].append(ptf['ref']) + # res['wmo'].append(ptf['wmos'][-1]['wmo']) + # res['wmo'].append(float_wmo(ptf['ref'])) # will not work for some CONFIRMED, PROBABLE or REGISTERED floats + # res['wmo'].append(float_wmo(ptf['wmos'][-1]['wmo'])) + res['status_code'].append(ptf['ptfStatus']['id']) + res['status_name'].append(ptf['ptfStatus']['name']) + + # res['ship_name'].append(ptf['ptfDepl']['shipName']) + program = ptf['program']['nameShort'].replace("_", " ") if ptf['program']['nameShort'] else ptf['program'][ + 'nameShort'] + res['program'].append(program) + res['country'].append(ptf['program']['country']['nameShort']) + res['model'].append(ptf['ptfModel']['nameShort']) + + # if status[ptf['ptfStatus']['name']] is None: + # status[ptf['ptfStatus']['name']] = ptf['ptfStatus']['description'] + + df = pd.DataFrame(res) + df = df.astype({'date': 'datetime64[s]'}) + df = df.sort_values(by='date').reset_index(drop=True) + # df = df[ (df['status_name'] == 'CLOSED') | (df['status_name'] == 'OPERATIONAL')] # Select only floats that have been deployed and returned data + # print(status) + return df + + def plot_status(self, + **kwargs + ): + """Quick plot of the deployment plan + + Named arguments are passed to :class:`plot.scatter_map` + + Returns + ------- + fig: :class:`matplotlib.figure.Figure` + ax: :class:`matplotlib.axes.Axes` + """ + df = self.to_dataframe() + fig, ax = scatter_map(df, + x='lon', + y='lat', + hue='status_code', + traj=False, + cmap='deployment_status', + **kwargs) + ax.set_title("Argo network deployment plan\n%s\nSource: OceanOPS API as of %s" + % (self.box_name, pd.to_datetime('now', utc=True).strftime("%Y-%m-%d %H:%M:%S")), + fontsize=12 + ) + return fig, ax + diff --git a/argopy/related/topo.py b/argopy/related/topography.py similarity index 100% rename from argopy/related/topo.py rename to argopy/related/topography.py diff --git a/argopy/utilities.py b/argopy/utilities.py index 9ff569f9..fc6c8e37 100644 --- a/argopy/utilities.py +++ b/argopy/utilities.py @@ -2941,378 +2941,6 @@ def all_tbl_name(self): return all_tables -class OceanOPSDeployments: - """Use the OceanOPS API for metadata access to retrieve Argo floats deployment information. - - The API is documented here: https://www.ocean-ops.org/api/swagger/?url=https://www.ocean-ops.org/api/1/oceanops-api.yaml - - Description of deployment status name: - - =========== == ==== - Status Id Description - =========== == ==== - PROBABLE 0 Starting status for some platforms, when there is only a few metadata available, like rough deployment location and date. The platform may be deployed - CONFIRMED 1 Automatically set when a ship is attached to the deployment information. 
The platform is ready to be deployed, deployment is planned - REGISTERED 2 Starting status for most of the networks, when deployment planning is not done. The deployment is certain, and a notification has been sent via the OceanOPS system - OPERATIONAL 6 Automatically set when the platform is emitting a pulse and observations are distributed within a certain time interval - INACTIVE 4 The platform is not emitting a pulse since a certain time - CLOSED 5 The platform is not emitting a pulse since a long time, it is considered as dead - =========== == ==== - - Examples - -------- - - Import the utility class: - - >>> from argopy.utilities import OceanOPSDeployments - >>> from argopy import OceanOPSDeployments - - Possibly define the space/time box to work with: - - >>> box = [-20, 0, 42, 51] - >>> box = [-20, 0, 42, 51, '2020-01', '2021-01'] - >>> box = [-180, 180, -90, 90, '2020-01', None] - - Instantiate the metadata fetcher: - - >>> deployment = OceanOPSDeployments() - >>> deployment = OceanOPSDeployments(box) - >>> deployment = OceanOPSDeployments(box, deployed_only=True) # Remove planification - - Load information: - - >>> df = deployment.to_dataframe() - >>> data = deployment.to_json() - - Useful attributes and methods: - - >>> deployment.uri - >>> deployment.uri_decoded - >>> deployment.status_code - >>> fig, ax = deployment.plot_status() - >>> plan_virtualfleet = deployment.plan - - """ - api = "https://www.ocean-ops.org" - """URL to the API""" - - model = "api/1/data/platform" - """This model represents a Platform entity and is used to retrieve a platform information (schema model - named 'Ptf').""" - - api_server_check = 'https://www.ocean-ops.org/api/1/oceanops-api.yaml' - """URL to check if the API is alive""" - - def __init__(self, box: list = None, deployed_only: bool = False): - """ - - Parameters - ---------- - box: list, optional, default=None - Define the domain to load the Argo deployment plan for. By default, **box** is set to None to work with the - global deployment plan starting from the current date. - The list expects one of the following format: - - - [lon_min, lon_max, lat_min, lat_max] - - [lon_min, lon_max, lat_min, lat_max, date_min] - - [lon_min, lon_max, lat_min, lat_max, date_min, date_max] - - Longitude and latitude values must be floats. Dates are strings. - If **box** is provided with a regional domain definition (only 4 values given), then ``date_min`` will be - set to the current date. - - deployed_only: bool, optional, default=False - Return only floats already deployed. If set to False (default), will return the full - deployment plan (floats with all possible status). If set to True, will return only floats with one of the - following status: ``OPERATIONAL``, ``INACTIVE``, and ``CLOSED``. 
- """ - if box is None: - box = [None, None, None, None, pd.to_datetime('now', utc=True).strftime("%Y-%m-%d"), None] - elif len(box) == 4: - box.append(pd.to_datetime('now', utc=True).strftime("%Y-%m-%d")) - box.append(None) - elif len(box) == 5: - box.append(None) - - if len(box) != 6: - raise ValueError("The 'box' argument must be: None or of lengths 4 or 5 or 6\n%s" % str(box)) - - self.box = box - self.deployed_only = deployed_only - self.data = None - - from .stores import httpstore - self.fs = httpstore(cache=False) - - def __format(self, x, typ: str) -> str: - """ string formatting helper """ - if typ == "lon": - return str(x) if x is not None else "-" - elif typ == "lat": - return str(x) if x is not None else "-" - elif typ == "tim": - return pd.to_datetime(x).strftime("%Y-%m-%d") if x is not None else "-" - else: - return str(x) - - def __repr__(self): - summary = [""] - summary.append("API: %s/%s" % (self.api, self.model)) - summary.append("Domain: %s" % self.box_name) - summary.append("Deployed only: %s" % self.deployed_only) - if self.data is not None: - summary.append("Nb of floats in the deployment plan: %s" % self.size) - else: - summary.append("Nb of floats in the deployment plan: - [Data not retrieved yet]") - return '\n'.join(summary) - - def __encode_inc(self, inc): - """Return encoded uri expression for 'include' parameter - - Parameters - ---------- - inc: str - - Returns - ------- - str - """ - return inc.replace("\"", "%22").replace("[", "%5B").replace("]", "%5D") - - def __encode_exp(self, exp): - """Return encoded uri expression for 'exp' parameter - - Parameters - ---------- - exp: str - - Returns - ------- - str - """ - return exp.replace("\"", "%22").replace("'", "%27").replace(" ", "%20").replace(">", "%3E").replace("<", "%3C") - - def __get_uri(self, encoded=False): - uri = "exp=%s&include=%s" % (self.exp(encoded=encoded), self.include(encoded=encoded)) - url = "%s/%s?%s" % (self.api, self.model, uri) - return url - - def include(self, encoded=False): - """Return an Ocean-Ops API 'include' expression - - This is used to determine which variables the API call should return - - Parameters - ---------- - encoded: bool, default=False - - Returns - ------- - str - """ - # inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus", "wmos"] - # inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus.id", "ptfStatus.name", "wmos"] - # inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus.id", "ptfStatus.name"] - inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus.id", "ptfStatus.name", - "ptfStatus.description", - "program.nameShort", "program.country.nameShort", "ptfModel.nameShort", "ptfDepl.noSite"] - inc = "[%s]" % ",".join(["\"%s\"" % v for v in inc]) - return inc if not encoded else self.__encode_inc(inc) - - def exp(self, encoded=False): - """Return an Ocean-Ops API deployment search expression for an argopy region box definition - - Parameters - ---------- - encoded: bool, default=False - - Returns - ------- - str - """ - exp, arg = "networkPtfs.network.name='Argo'", [] - if self.box[0] is not None: - exp += " and ptfDepl.lon>=$var%i" % (len(arg) + 1) - arg.append(str(self.box[0])) - if self.box[1] is not None: - exp += " and ptfDepl.lon<=$var%i" % (len(arg) + 1) - arg.append(str(self.box[1])) - if self.box[2] is not None: - exp += " and ptfDepl.lat>=$var%i" % (len(arg) + 1) - arg.append(str(self.box[2])) - if self.box[3] is not None: - exp += " and ptfDepl.lat<=$var%i" % (len(arg) 
+ 1) - arg.append(str(self.box[3])) - if len(self.box) > 4: - if self.box[4] is not None: - exp += " and ptfDepl.deplDate>=$var%i" % (len(arg) + 1) - arg.append("\"%s\"" % pd.to_datetime(self.box[4]).strftime("%Y-%m-%d %H:%M:%S")) - if self.box[5] is not None: - exp += " and ptfDepl.deplDate<=$var%i" % (len(arg) + 1) - arg.append("\"%s\"" % pd.to_datetime(self.box[5]).strftime("%Y-%m-%d %H:%M:%S")) - - if self.deployed_only: - exp += " and ptfStatus>=$var%i" % (len(arg) + 1) - arg.append(str(4)) # Allow for: 4, 5 or 6 - - exp = "[\"%s\", %s]" % (exp, ", ".join(arg)) - return exp if not encoded else self.__encode_exp(exp) - - @property - def size(self): - return len(self.data['data']) if self.data is not None else None - - @property - def status_code(self): - """Return a :class:`pandas.DataFrame` with the definition of status""" - status = {'status_code': [0, 1, 2, 6, 4, 5], - 'status_name': ['PROBABLE', 'CONFIRMED', 'REGISTERED', 'OPERATIONAL', 'INACTIVE', 'CLOSED'], - 'description': [ - 'Starting status for some platforms, when there is only a few metadata available, like rough deployment location and date. The platform may be deployed', - 'Automatically set when a ship is attached to the deployment information. The platform is ready to be deployed, deployment is planned', - 'Starting status for most of the networks, when deployment planning is not done. The deployment is certain, and a notification has been sent via the OceanOPS system', - 'Automatically set when the platform is emitting a pulse and observations are distributed within a certain time interval', - 'The platform is not emitting a pulse since a certain time', - 'The platform is not emitting a pulse since a long time, it is considered as dead', - ], - } - return pd.DataFrame(status).set_index('status_code') - - @property - def box_name(self): - """Return a string to print the box property""" - BOX = self.box - cname = ("[lon=%s/%s; lat=%s/%s]") % ( - self.__format(BOX[0], "lon"), - self.__format(BOX[1], "lon"), - self.__format(BOX[2], "lat"), - self.__format(BOX[3], "lat"), - ) - if len(BOX) == 6: - cname = ("[lon=%s/%s; lat=%s/%s; t=%s/%s]") % ( - self.__format(BOX[0], "lon"), - self.__format(BOX[1], "lon"), - self.__format(BOX[2], "lat"), - self.__format(BOX[3], "lat"), - self.__format(BOX[4], "tim"), - self.__format(BOX[5], "tim"), - ) - return cname - - @property - def uri(self): - """Return encoded URL to post an Ocean-Ops API request - - Returns - ------- - str - """ - return self.__get_uri(encoded=True) - - @property - def uri_decoded(self): - """Return decoded URL to post an Ocean-Ops API request - - Returns - ------- - str - """ - return self.__get_uri(encoded=False) - - @property - def plan(self): - """Return a dictionary to be used as argument in a :class:`virtualargofleet.VirtualFleet` - - This method is for dev, but will be moved to the VirtualFleet software utilities - """ - df = self.to_dataframe() - plan = df[['lon', 'lat', 'date']].rename(columns={"date": "time"}).to_dict('series') - for key in plan.keys(): - plan[key] = plan[key].to_list() - plan['time'] = np.array(plan['time'], dtype='datetime64') - return plan - - def to_json(self): - """Return OceanOPS API request response as a json object""" - if self.data is None: - self.data = self.fs.open_json(self.uri) - return self.data - - def to_dataframe(self): - """Return the deployment plan as :class:`pandas.DataFrame` - - Returns - ------- - :class:`pandas.DataFrame` - """ - data = self.to_json() - if data['total'] == 0: - raise DataNotFound('Your search 
matches no results') - - # res = {'date': [], 'lat': [], 'lon': [], 'wmo': [], 'status_name': [], 'status_code': []} - # res = {'date': [], 'lat': [], 'lon': [], 'wmo': [], 'status_name': [], 'status_code': [], 'ship_name': []} - res = {'date': [], 'lat': [], 'lon': [], 'wmo': [], 'status_name': [], 'status_code': [], 'program': [], - 'country': [], 'model': []} - # status = {'REGISTERED': None, 'OPERATIONAL': None, 'INACTIVE': None, 'CLOSED': None, - # 'CONFIRMED': None, 'OPERATIONAL': None, 'PROBABLE': None, 'REGISTERED': None} - - for irow, ptf in enumerate(data['data']): - # if irow == 0: - # print(ptf) - res['lat'].append(ptf['ptfDepl']['lat']) - res['lon'].append(ptf['ptfDepl']['lon']) - res['date'].append(ptf['ptfDepl']['deplDate']) - res['wmo'].append(ptf['ref']) - # res['wmo'].append(ptf['wmos'][-1]['wmo']) - # res['wmo'].append(float_wmo(ptf['ref'])) # will not work for some CONFIRMED, PROBABLE or REGISTERED floats - # res['wmo'].append(float_wmo(ptf['wmos'][-1]['wmo'])) - res['status_code'].append(ptf['ptfStatus']['id']) - res['status_name'].append(ptf['ptfStatus']['name']) - - # res['ship_name'].append(ptf['ptfDepl']['shipName']) - program = ptf['program']['nameShort'].replace("_", " ") if ptf['program']['nameShort'] else ptf['program'][ - 'nameShort'] - res['program'].append(program) - res['country'].append(ptf['program']['country']['nameShort']) - res['model'].append(ptf['ptfModel']['nameShort']) - - # if status[ptf['ptfStatus']['name']] is None: - # status[ptf['ptfStatus']['name']] = ptf['ptfStatus']['description'] - - df = pd.DataFrame(res) - df = df.astype({'date': 'datetime64[s]'}) - df = df.sort_values(by='date').reset_index(drop=True) - # df = df[ (df['status_name'] == 'CLOSED') | (df['status_name'] == 'OPERATIONAL')] # Select only floats that have been deployed and returned data - # print(status) - return df - - def plot_status(self, - **kwargs - ): - """Quick plot of the deployment plan - - Named arguments are passed to :class:`plot.scatter_map` - - Returns - ------- - fig: :class:`matplotlib.figure.Figure` - ax: :class:`matplotlib.axes.Axes` - """ - from .plot.plot import scatter_map - df = self.to_dataframe() - fig, ax = scatter_map(df, - x='lon', - y='lat', - hue='status_code', - traj=False, - cmap='deployment_status', - **kwargs) - ax.set_title("Argo network deployment plan\n%s\nSource: OceanOPS API as of %s" - % (self.box_name, pd.to_datetime('now', utc=True).strftime("%Y-%m-%d %H:%M:%S")), - fontsize=12 - ) - return fig, ax - @deprecated def cast_types(ds): # noqa: C901 From 3d3cff9f74583503dfaaa00358e617adbf7fdc06 Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Wed, 6 Sep 2023 16:15:44 +0200 Subject: [PATCH 04/33] [skip-ci] --- argopy/__init__.py | 4 +- argopy/related/__init__.py | 4 + argopy/related/argo_documentation.py | 348 ++++++++++++++ argopy/related/ocean_ops_deployments.py | 193 +++++--- argopy/related/reference_tables.py | 245 ++++++++++ argopy/related/topography.py | 30 +- argopy/utilities.py | 583 ------------------------ 7 files changed, 744 insertions(+), 663 deletions(-) create mode 100644 argopy/related/argo_documentation.py create mode 100644 argopy/related/reference_tables.py diff --git a/argopy/__init__.py b/argopy/__init__.py index 8c8f6cf7..8f2c8392 100644 --- a/argopy/__init__.py +++ b/argopy/__init__.py @@ -35,13 +35,13 @@ from . 
import plot # noqa: E402 from .plot import dashboard, ArgoColors # noqa: E402 from .utilities import show_versions, show_options, clear_cache, lscache # noqa: E402 -from .utilities import ArgoNVSReferenceTables, ArgoDocs # noqa: E402 +from .utilities import ArgoDocs # noqa: E402 from .utilities import monitor_status as status # noqa: E402 from .options import set_options, reset_options # noqa: E402 from .data_fetchers import CTDRefDataFetcher # noqa: E402 from .stores import ArgoIndex # noqa: E402 from .utils import compute # noqa: E402, F401 -from .related import TopoFetcher, OceanOPSDeployments # noqa: E402 +from .related import TopoFetcher, OceanOPSDeployments, ArgoNVSReferenceTables # noqa: E402 # __all__ = ( diff --git a/argopy/related/__init__.py b/argopy/related/__init__.py index f2c85631..bc82a46e 100644 --- a/argopy/related/__init__.py +++ b/argopy/related/__init__.py @@ -1,9 +1,13 @@ from .topography import TopoFetcher from .ocean_ops_deployments import OceanOPSDeployments +from .reference_tables import ArgoNVSReferenceTables +from .argo_documentation import ArgoDocs # __all__ = ( # Classes: "TopoFetcher", "OceanOPSDeployments", + "ArgoNVSReferenceTables", + "ArgoDocs", ) \ No newline at end of file diff --git a/argopy/related/argo_documentation.py b/argopy/related/argo_documentation.py new file mode 100644 index 00000000..0ed70a39 --- /dev/null +++ b/argopy/related/argo_documentation.py @@ -0,0 +1,348 @@ +import pandas as pd +from functools import lru_cache +from ..stores import httpstore +from ..options import OPTIONS + + +class ArgoDocs: + """ADMT documentation helper class + + Examples + -------- + >>> ArgoDocs().list + >>> ArgoDocs().search("CDOM") + >>> ArgoDocs().search("CDOM", where='abstract') + + >>> ArgoDocs(35385) + >>> ArgoDocs(35385).ris + >>> ArgoDocs(35385).abstract + >>> ArgoDocs(35385).show() + >>> ArgoDocs(35385).open_pdf() + >>> ArgoDocs(35385).open_pdf(page=12) + + """ + _catalogue = [ + { + "category": "Argo data formats", + "title": "Argo user's manual", + "doi": "10.13155/29825", + "id": 29825 + }, + { + "category": "Quality control", + "title": "Argo Quality Control Manual for CTD and Trajectory Data", + "doi": "10.13155/33951", + "id": 33951 + }, + { + "category": "Quality control", + "title": "Argo quality control manual for dissolved oxygen concentration", + "doi": "10.13155/46542", + "id": 46542 + }, + { + "category": "Quality control", + "title": "Argo quality control manual for biogeochemical data", + "doi": "10.13155/40879", + "id": 40879 + }, + { + "category": "Quality control", + "title": "BGC-Argo quality control manual for the Chlorophyll-A concentration", + "doi": "10.13155/35385", + "id": 35385 + }, + { + "category": "Quality control", + "title": "BGC-Argo quality control manual for nitrate concentration", + "doi": "10.13155/84370", + "id": 84370 + }, + { + "category": "Quality control", + "title": "Quality control for BGC-Argo radiometry", + "doi": "10.13155/62466", + "id": 62466 + }, + { + "category": "Cookbooks", + "title": "Argo DAC profile cookbook", + "doi": "10.13155/41151", + "id": 41151 + }, + { + "category": "Cookbooks", + "title": "Argo DAC trajectory cookbook", + "doi": "10.13155/29824", + "id": 29824 + }, + { + "category": "Cookbooks", + "title": "DMQC Cookbook for Core Argo parameters", + "doi": "10.13155/78994", + "id": 78994 + }, + { + "category": "Cookbooks", + "title": "Processing Argo oxygen data at the DAC level", + "doi": "10.13155/39795", + "id": 39795 + }, + { + "category": "Cookbooks", + "title": "Processing Bio-Argo 
particle backscattering at the DAC level", + "doi": "10.13155/39459", + "id": 39459 + }, + { + "category": "Cookbooks", + "title": "Processing BGC-Argo chlorophyll-A concentration at the DAC level", + "doi": "10.13155/39468", + "id": 39468 + }, + { + "category": "Cookbooks", + "title": "Processing Argo measurement timing information at the DAC level", + "doi": "10.13155/47998", + "id": 47998 + }, + { + "category": "Cookbooks", + "title": "Processing BGC-Argo CDOM concentration at the DAC level", + "doi": "10.13155/54541", + "id": 54541 + }, + { + "category": "Cookbooks", + "title": "Processing Bio-Argo nitrate concentration at the DAC Level", + "doi": "10.13155/46121", + "id": 46121 + }, + { + "category": "Cookbooks", + "title": "Processing BGC-Argo Radiometric data at the DAC level", + "doi": "10.13155/51541", + "id": 51541 + }, + { + "category": "Cookbooks", + "title": "Processing BGC-Argo pH data at the DAC level", + "doi": "10.13155/57195", + "id": 57195 + }, + { + "category": "Cookbooks", + "title": "Description of the Argo GDAC File Checks: Data Format and Consistency Checks", + "doi": "10.13155/46120", + "id": 46120 + }, + { + "category": "Cookbooks", + "title": "Description of the Argo GDAC File Merge Process", + "doi": "10.13155/52154", + "id": 52154 + }, + { + "category": "Cookbooks", + "title": "BGC-Argo synthetic profile file processing and format on Coriolis GDAC", + "doi": "10.13155/55637", + "id": 55637 + }, + { + "category": "Cookbooks", + "title": "Argo GDAC cookbook", + "doi": "10.13155/46202", + "id": 46202 + } + ] + + class RIS: + """RIS file structure from TXT file""" + + def __init__(self, file=None, fs=None): + self.record = None + self.fs = fs + if file: + self.parse(file) + + def parse(self, file): + """Parse input file""" + # log.debug(file) + + with self.fs.open(file, 'r', encoding="utf-8") as f: + TXTlines = f.readlines() + lines = [] + # Eliminate blank lines + for line in TXTlines: + line = line.strip() + if len(line) > 0: + lines.append(line) + TXTlines = lines + + # + record = {} + for line in TXTlines: + # print("\n>", line) + if len(line) > 2: + if line[2] == " ": + tag = line[0:2] + field = line[3:] + # print("ok", {tag: field}) + record[tag] = [field] + else: + # print("-", line) + record[tag].append(line) + elif len(line) == 2: + record[line] = [] + # else: + # print("*", line) + + for key in record.keys(): + record[key] = "; ".join(record[key]) + + self.record = record + + @lru_cache + def __init__(self, docid=None, cache=False): + self.docid = None + self._ris = None + self._risfile = None + self._fs = httpstore(cache=cache, cachedir=OPTIONS['cachedir']) + self._doiserver = "https://dx.doi.org" + self._archimer = "https://archimer.ifremer.fr" + + if isinstance(docid, int): + if docid in [doc['id'] for doc in self._catalogue]: + self.docid = docid + else: + raise ValueError("Unknown document id") + elif isinstance(docid, str): + start_with = lambda f, x: f[0:len(x)] == x if len(x) <= len(f) else False # noqa: E731 + if start_with(docid, '10.13155/') and docid in [doc['doi'] for doc in self._catalogue]: + self.docid = [doc['id'] for doc in self._catalogue if docid == doc['doi']][0] + else: + raise ValueError("'docid' must be an integer or a valid Argo DOI") + + def __repr__(self): + summary = [""] + if self.docid is not None: + doc = [doc for doc in self._catalogue if doc['id'] == self.docid][0] + summary.append("Title: %s" % doc['title']) + summary.append("DOI: %s" % doc['doi']) + summary.append("url: https://dx.doi.org/%s" % doc['doi']) + 
summary.append("last pdf: %s" % self.pdf) + if 'AF' in self.ris: + summary.append("Authors: %s" % self.ris['AF']) + summary.append("Abstract: %s" % self.ris['AB']) + else: + summary.append("- %i documents with a DOI are available in the catalogue" % len(self._catalogue)) + summary.append("- Use the method 'search' to find a document id") + summary.append("- Use the property 'list' to check out the catalogue") + return "\n".join(summary) + + @property + def list(self): + """List of all available documents as a :class:`pandas.DataFrame`""" + return pd.DataFrame(self._catalogue) + + @property + def js(self): + """Internal json record for a document""" + if self.docid is not None: + return [doc for doc in self._catalogue if doc['id'] == self.docid][0] + else: + raise ValueError("Select a document first !") + + @property + def ris(self): + """RIS record of a document""" + if self.docid is not None: + if self._ris is None: + # Fetch RIS metadata for this document: + import re + file = self._fs.download_url("%s/%s" % (self._doiserver, self.js['doi'])) + x = re.search(r']*)rel="nofollow">TXT<\/a>', + str(file)) + export_txt_url = x[1].replace("https://archimer.ifremer.fr", self._archimer) + self._risfile = export_txt_url + self._ris = self.RIS(export_txt_url, fs=self._fs).record + return self._ris + else: + raise ValueError("Select a document first !") + + @property + def abstract(self): + """Abstract of a document""" + if self.docid is not None: + return self.ris['AB'] + else: + raise ValueError("Select a document first !") + + @property + def pdf(self): + """Link to the online pdf version of a document""" + if self.docid is not None: + return self.ris['UR'] + else: + raise ValueError("Select a document first !") + + def show(self, height=800): + """Insert document in pdf in a notebook cell + + Parameters + ---------- + height: int + Height in pixels of the cell + """ + if self.docid is not None: + from IPython.core.display import HTML + return HTML( + '' % (self.ris['UR'], height)) + else: + raise ValueError("Select a document first !") + + def open_pdf(self, page=None, url_only=False): + """Open document in new browser tab + + Parameters + ---------- + page: int, optional + Open directly a specific page number + """ + url = self.pdf + url += '#view=FitV&pagemode=thumbs' + if page: + url += '&page=%i' % page + if self.docid is not None: + if not url_only: + import webbrowser + webbrowser.open_new(url) + else: + return url + else: + raise ValueError("Select a document first !") + + def search(self, txt, where='title'): + """Search for string in all documents title or abstract + + Parameters + ---------- + txt: str + where: str, default='title' + Where to search, can be 'title' or 'abstract' + + Returns + ------- + list + + """ + results = [] + for doc in self.list.iterrows(): + docid = doc[1]['id'] + if where == 'title': + if txt.lower() in ArgoDocs(docid).js['title'].lower(): + results.append(docid) + elif where == 'abstract': + if txt.lower() in ArgoDocs(docid).abstract.lower(): + results.append(docid) + return results diff --git a/argopy/related/ocean_ops_deployments.py b/argopy/related/ocean_ops_deployments.py index a1a2dea6..3350ebd6 100644 --- a/argopy/related/ocean_ops_deployments.py +++ b/argopy/related/ocean_ops_deployments.py @@ -57,6 +57,7 @@ class OceanOPSDeployments: >>> plan_virtualfleet = deployment.plan """ + api = "https://www.ocean-ops.org" """URL to the API""" @@ -64,7 +65,7 @@ class OceanOPSDeployments: """This model represents a Platform entity and is used to retrieve a 
platform information (schema model named 'Ptf').""" - api_server_check = 'https://www.ocean-ops.org/api/1/oceanops-api.yaml' + api_server_check = "https://www.ocean-ops.org/api/1/oceanops-api.yaml" """URL to check if the API is alive""" def __init__(self, box: list = None, deployed_only: bool = False): @@ -91,15 +92,25 @@ def __init__(self, box: list = None, deployed_only: bool = False): following status: ``OPERATIONAL``, ``INACTIVE``, and ``CLOSED``. """ if box is None: - box = [None, None, None, None, pd.to_datetime('now', utc=True).strftime("%Y-%m-%d"), None] + box = [ + None, + None, + None, + None, + pd.to_datetime("now", utc=True).strftime("%Y-%m-%d"), + None, + ] elif len(box) == 4: - box.append(pd.to_datetime('now', utc=True).strftime("%Y-%m-%d")) + box.append(pd.to_datetime("now", utc=True).strftime("%Y-%m-%d")) box.append(None) elif len(box) == 5: box.append(None) if len(box) != 6: - raise ValueError("The 'box' argument must be: None or of lengths 4 or 5 or 6\n%s" % str(box)) + raise ValueError( + "The 'box' argument must be: None or of lengths 4 or 5 or 6\n%s" + % str(box) + ) self.box = box self.deployed_only = deployed_only @@ -108,7 +119,7 @@ def __init__(self, box: list = None, deployed_only: bool = False): self.fs = httpstore(cache=False) def __format(self, x, typ: str) -> str: - """ string formatting helper """ + """string formatting helper""" if typ == "lon": return str(x) if x is not None else "-" elif typ == "lat": @@ -126,8 +137,10 @@ def __repr__(self): if self.data is not None: summary.append("Nb of floats in the deployment plan: %s" % self.size) else: - summary.append("Nb of floats in the deployment plan: - [Data not retrieved yet]") - return '\n'.join(summary) + summary.append( + "Nb of floats in the deployment plan: - [Data not retrieved yet]" + ) + return "\n".join(summary) def __encode_inc(self, inc): """Return encoded uri expression for 'include' parameter @@ -140,7 +153,7 @@ def __encode_inc(self, inc): ------- str """ - return inc.replace("\"", "%22").replace("[", "%5B").replace("]", "%5D") + return inc.replace('"', "%22").replace("[", "%5B").replace("]", "%5D") def __encode_exp(self, exp): """Return encoded uri expression for 'exp' parameter @@ -153,10 +166,19 @@ def __encode_exp(self, exp): ------- str """ - return exp.replace("\"", "%22").replace("'", "%27").replace(" ", "%20").replace(">", "%3E").replace("<", "%3C") + return ( + exp.replace('"', "%22") + .replace("'", "%27") + .replace(" ", "%20") + .replace(">", "%3E") + .replace("<", "%3C") + ) def __get_uri(self, encoded=False): - uri = "exp=%s&include=%s" % (self.exp(encoded=encoded), self.include(encoded=encoded)) + uri = "exp=%s&include=%s" % ( + self.exp(encoded=encoded), + self.include(encoded=encoded), + ) url = "%s/%s?%s" % (self.api, self.model, uri) return url @@ -176,10 +198,20 @@ def include(self, encoded=False): # inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus", "wmos"] # inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus.id", "ptfStatus.name", "wmos"] # inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus.id", "ptfStatus.name"] - inc = ["ref", "ptfDepl.lat", "ptfDepl.lon", "ptfDepl.deplDate", "ptfStatus.id", "ptfStatus.name", - "ptfStatus.description", - "program.nameShort", "program.country.nameShort", "ptfModel.nameShort", "ptfDepl.noSite"] - inc = "[%s]" % ",".join(["\"%s\"" % v for v in inc]) + inc = [ + "ref", + "ptfDepl.lat", + "ptfDepl.lon", + "ptfDepl.deplDate", + "ptfStatus.id", + "ptfStatus.name", + 
"ptfStatus.description", + "program.nameShort", + "program.country.nameShort", + "ptfModel.nameShort", + "ptfDepl.noSite", + ] + inc = "[%s]" % ",".join(['"%s"' % v for v in inc]) return inc if not encoded else self.__encode_inc(inc) def exp(self, encoded=False): @@ -209,37 +241,49 @@ def exp(self, encoded=False): if len(self.box) > 4: if self.box[4] is not None: exp += " and ptfDepl.deplDate>=$var%i" % (len(arg) + 1) - arg.append("\"%s\"" % pd.to_datetime(self.box[4]).strftime("%Y-%m-%d %H:%M:%S")) + arg.append( + '"%s"' % pd.to_datetime(self.box[4]).strftime("%Y-%m-%d %H:%M:%S") + ) if self.box[5] is not None: exp += " and ptfDepl.deplDate<=$var%i" % (len(arg) + 1) - arg.append("\"%s\"" % pd.to_datetime(self.box[5]).strftime("%Y-%m-%d %H:%M:%S")) + arg.append( + '"%s"' % pd.to_datetime(self.box[5]).strftime("%Y-%m-%d %H:%M:%S") + ) if self.deployed_only: exp += " and ptfStatus>=$var%i" % (len(arg) + 1) arg.append(str(4)) # Allow for: 4, 5 or 6 - exp = "[\"%s\", %s]" % (exp, ", ".join(arg)) + exp = '["%s", %s]' % (exp, ", ".join(arg)) return exp if not encoded else self.__encode_exp(exp) @property def size(self): - return len(self.data['data']) if self.data is not None else None + return len(self.data["data"]) if self.data is not None else None @property def status_code(self): """Return a :class:`pandas.DataFrame` with the definition of status""" - status = {'status_code': [0, 1, 2, 6, 4, 5], - 'status_name': ['PROBABLE', 'CONFIRMED', 'REGISTERED', 'OPERATIONAL', 'INACTIVE', 'CLOSED'], - 'description': [ - 'Starting status for some platforms, when there is only a few metadata available, like rough deployment location and date. The platform may be deployed', - 'Automatically set when a ship is attached to the deployment information. The platform is ready to be deployed, deployment is planned', - 'Starting status for most of the networks, when deployment planning is not done. The deployment is certain, and a notification has been sent via the OceanOPS system', - 'Automatically set when the platform is emitting a pulse and observations are distributed within a certain time interval', - 'The platform is not emitting a pulse since a certain time', - 'The platform is not emitting a pulse since a long time, it is considered as dead', - ], - } - return pd.DataFrame(status).set_index('status_code') + status = { + "status_code": [0, 1, 2, 6, 4, 5], + "status_name": [ + "PROBABLE", + "CONFIRMED", + "REGISTERED", + "OPERATIONAL", + "INACTIVE", + "CLOSED", + ], + "description": [ + "Starting status for some platforms, when there is only a few metadata available, like rough deployment location and date. The platform may be deployed", + "Automatically set when a ship is attached to the deployment information. The platform is ready to be deployed, deployment is planned", + "Starting status for most of the networks, when deployment planning is not done. 
The deployment is certain, and a notification has been sent via the OceanOPS system", + "Automatically set when the platform is emitting a pulse and observations are distributed within a certain time interval", + "The platform is not emitting a pulse since a certain time", + "The platform is not emitting a pulse since a long time, it is considered as dead", + ], + } + return pd.DataFrame(status).set_index("status_code") @property def box_name(self): @@ -289,10 +333,14 @@ def plan(self): This method is for dev, but will be moved to the VirtualFleet software utilities """ df = self.to_dataframe() - plan = df[['lon', 'lat', 'date']].rename(columns={"date": "time"}).to_dict('series') + plan = ( + df[["lon", "lat", "date"]] + .rename(columns={"date": "time"}) + .to_dict("series") + ) for key in plan.keys(): plan[key] = plan[key].to_list() - plan['time'] = np.array(plan['time'], dtype='datetime64') + plan["time"] = np.array(plan["time"], dtype="datetime64") return plan def to_json(self): @@ -309,49 +357,59 @@ def to_dataframe(self): :class:`pandas.DataFrame` """ data = self.to_json() - if data['total'] == 0: - raise DataNotFound('Your search matches no results') + if data["total"] == 0: + raise DataNotFound("Your search matches no results") # res = {'date': [], 'lat': [], 'lon': [], 'wmo': [], 'status_name': [], 'status_code': []} # res = {'date': [], 'lat': [], 'lon': [], 'wmo': [], 'status_name': [], 'status_code': [], 'ship_name': []} - res = {'date': [], 'lat': [], 'lon': [], 'wmo': [], 'status_name': [], 'status_code': [], 'program': [], - 'country': [], 'model': []} + res = { + "date": [], + "lat": [], + "lon": [], + "wmo": [], + "status_name": [], + "status_code": [], + "program": [], + "country": [], + "model": [], + } # status = {'REGISTERED': None, 'OPERATIONAL': None, 'INACTIVE': None, 'CLOSED': None, # 'CONFIRMED': None, 'OPERATIONAL': None, 'PROBABLE': None, 'REGISTERED': None} - for irow, ptf in enumerate(data['data']): + for irow, ptf in enumerate(data["data"]): # if irow == 0: # print(ptf) - res['lat'].append(ptf['ptfDepl']['lat']) - res['lon'].append(ptf['ptfDepl']['lon']) - res['date'].append(ptf['ptfDepl']['deplDate']) - res['wmo'].append(ptf['ref']) + res["lat"].append(ptf["ptfDepl"]["lat"]) + res["lon"].append(ptf["ptfDepl"]["lon"]) + res["date"].append(ptf["ptfDepl"]["deplDate"]) + res["wmo"].append(ptf["ref"]) # res['wmo'].append(ptf['wmos'][-1]['wmo']) # res['wmo'].append(float_wmo(ptf['ref'])) # will not work for some CONFIRMED, PROBABLE or REGISTERED floats # res['wmo'].append(float_wmo(ptf['wmos'][-1]['wmo'])) - res['status_code'].append(ptf['ptfStatus']['id']) - res['status_name'].append(ptf['ptfStatus']['name']) + res["status_code"].append(ptf["ptfStatus"]["id"]) + res["status_name"].append(ptf["ptfStatus"]["name"]) # res['ship_name'].append(ptf['ptfDepl']['shipName']) - program = ptf['program']['nameShort'].replace("_", " ") if ptf['program']['nameShort'] else ptf['program'][ - 'nameShort'] - res['program'].append(program) - res['country'].append(ptf['program']['country']['nameShort']) - res['model'].append(ptf['ptfModel']['nameShort']) + program = ( + ptf["program"]["nameShort"].replace("_", " ") + if ptf["program"]["nameShort"] + else ptf["program"]["nameShort"] + ) + res["program"].append(program) + res["country"].append(ptf["program"]["country"]["nameShort"]) + res["model"].append(ptf["ptfModel"]["nameShort"]) # if status[ptf['ptfStatus']['name']] is None: # status[ptf['ptfStatus']['name']] = ptf['ptfStatus']['description'] df = pd.DataFrame(res) - df = 
df.astype({'date': 'datetime64[s]'}) - df = df.sort_values(by='date').reset_index(drop=True) + df = df.astype({"date": "datetime64[s]"}) + df = df.sort_values(by="date").reset_index(drop=True) # df = df[ (df['status_name'] == 'CLOSED') | (df['status_name'] == 'OPERATIONAL')] # Select only floats that have been deployed and returned data # print(status) return df - def plot_status(self, - **kwargs - ): + def plot_status(self, **kwargs): """Quick plot of the deployment plan Named arguments are passed to :class:`plot.scatter_map` @@ -362,16 +420,21 @@ def plot_status(self, ax: :class:`matplotlib.axes.Axes` """ df = self.to_dataframe() - fig, ax = scatter_map(df, - x='lon', - y='lat', - hue='status_code', - traj=False, - cmap='deployment_status', - **kwargs) - ax.set_title("Argo network deployment plan\n%s\nSource: OceanOPS API as of %s" - % (self.box_name, pd.to_datetime('now', utc=True).strftime("%Y-%m-%d %H:%M:%S")), - fontsize=12 - ) + fig, ax = scatter_map( + df, + x="lon", + y="lat", + hue="status_code", + traj=False, + cmap="deployment_status", + **kwargs + ) + ax.set_title( + "Argo network deployment plan\n%s\nSource: OceanOPS API as of %s" + % ( + self.box_name, + pd.to_datetime("now", utc=True).strftime("%Y-%m-%d %H:%M:%S"), + ), + fontsize=12, + ) return fig, ax - diff --git a/argopy/related/reference_tables.py b/argopy/related/reference_tables.py new file mode 100644 index 00000000..622eee7f --- /dev/null +++ b/argopy/related/reference_tables.py @@ -0,0 +1,245 @@ +import pandas as pd +from functools import lru_cache +import collections +from ..stores import httpstore +from ..options import OPTIONS + + +class ArgoNVSReferenceTables: + """Argo Reference Tables + + Utility function to retrieve Argo Reference Tables from a NVS server. + + By default, this relies on: https://vocab.nerc.ac.uk/collection + + Examples + -------- + Methods: + + >>> R = ArgoNVSReferenceTables() + >>> R.search('sensor') + >>> R.tbl(3) + >>> R.tbl('R09') + + Properties: + + >>> R.all_tbl_name + >>> R.all_tbl + >>> R.valid_ref + + """ + + valid_ref = [ + "R01", + "RR2", + "RD2", + "RP2", + "R03", + "R04", + "R05", + "R06", + "R07", + "R08", + "R09", + "R10", + "R11", + "R12", + "R13", + "R15", + "RMC", + "RTV", + "R16", + # "R18", + "R19", + "R20", + "R21", + "R22", + "R23", + "R24", + "R25", + "R26", + "R27", + # "R28", + # "R29", + # "R30", + "R40", + ] + """List of all available Reference Tables""" + + def __init__( + self, + nvs="https://vocab.nerc.ac.uk/collection", + cache: bool = True, + cachedir: str = "", + ): + """Argo Reference Tables from NVS""" + + cachedir = OPTIONS["cachedir"] if cachedir == "" else cachedir + self.fs = httpstore(cache=cache, cachedir=cachedir) + self.nvs = nvs + + def _valid_ref(self, rtid): + if rtid not in self.valid_ref: + rtid = "R%0.2d" % rtid + if rtid not in self.valid_ref: + raise ValueError( + "Invalid Argo Reference Table, should be one in: %s" + % ", ".join(self.valid_ref) + ) + return rtid + + def _jsConcept2df(self, data): + """Return all skos:Concept as class:`pandas.DataFrame`""" + content = { + "altLabel": [], + "prefLabel": [], + "definition": [], + "deprecated": [], + "id": [], + } + for k in data["@graph"]: + if k["@type"] == "skos:Collection": + Collection_name = k["alternative"] + elif k["@type"] == "skos:Concept": + content["altLabel"].append(k["altLabel"]) + content["prefLabel"].append(k["prefLabel"]["@value"]) + content["definition"].append(k["definition"]["@value"]) + content["deprecated"].append(k["deprecated"]) + content["id"].append(k["@id"]) + df = 
pd.DataFrame.from_dict(content) + df.name = Collection_name + return df + + def _jsCollection(self, data): + """Return last skos:Collection information as data""" + for k in data["@graph"]: + if k["@type"] == "skos:Collection": + name = k["alternative"] + desc = k["description"] + rtid = k["@id"] + return (name, desc, rtid) + + def get_url(self, rtid, fmt="ld+json"): + """Return URL toward a given reference table for a given format + + Parameters + ---------- + rtid: {str, int} + Name or number of the reference table to retrieve. Eg: 'R01', 12 + fmt: str, default: "ld+json" + Format of the NVS server response. Can be: "ld+json", "rdf+xml" or "text/turtle". + + Returns + ------- + str + """ + rtid = self._valid_ref(rtid) + if fmt == "ld+json": + fmt_ext = "?_profile=nvs&_mediatype=application/ld+json" + elif fmt == "rdf+xml": + fmt_ext = "?_profile=nvs&_mediatype=application/rdf+xml" + elif fmt == "text/turtle": + fmt_ext = "?_profile=nvs&_mediatype=text/turtle" + else: + raise ValueError( + "Invalid format. Must be in: 'ld+json', 'rdf+xml' or 'text/turtle'." + ) + url = "{}/{}/current/{}".format + return url(self.nvs, rtid, fmt_ext) + + @lru_cache + def tbl(self, rtid): + """Return an Argo Reference table + + Parameters + ---------- + rtid: {str, int} + Name or number of the reference table to retrieve. Eg: 'R01', 12 + + Returns + ------- + class:`pandas.DataFrame` + """ + rtid = self._valid_ref(rtid) + js = self.fs.open_json(self.get_url(rtid)) + df = self._jsConcept2df(js) + return df + + def tbl_name(self, rtid): + """Return name of an Argo Reference table + + Parameters + ---------- + rtid: {str, int} + Name or number of the reference table to retrieve. Eg: 'R01', 12 + + Returns + ------- + tuple('short name', 'description', 'NVS id link') + """ + rtid = self._valid_ref(rtid) + js = self.fs.open_json(self.get_url(rtid)) + return self._jsCollection(js) + + def search(self, txt, where="all"): + """Search for string in tables title and/or description + + Parameters + ---------- + txt: str + where: str, default='all' + Where to search, can be: 'title', 'description', 'all' + + Returns + ------- + list of table id matching the search + """ + results = [] + for tbl_id in self.all_tbl_name: + title = self.tbl_name(tbl_id)[0] + description = self.tbl_name(tbl_id)[1] + if where == "title": + if txt.lower() in title.lower(): + results.append(tbl_id) + elif where == "description": + if txt.lower() in description.lower(): + results.append(tbl_id) + elif where == "all": + if txt.lower() in description.lower() or txt.lower() in title.lower(): + results.append(tbl_id) + return results + + @property + def all_tbl(self): + """Return all Argo Reference tables + + Returns + ------- + OrderedDict + Dictionary with all table short names as key and table content as class:`pandas.DataFrame` + """ + URLs = [self.get_url(rtid) for rtid in self.valid_ref] + df_list = self.fs.open_mfjson(URLs, preprocess=self._jsConcept2df) + all_tables = {} + [all_tables.update({t.name: t}) for t in df_list] + all_tables = collections.OrderedDict(sorted(all_tables.items())) + return all_tables + + @property + def all_tbl_name(self): + """Return names of all Argo Reference tables + + Returns + ------- + OrderedDict + Dictionary with all table short names as key and table names as tuple('short name', 'description', 'NVS id link') + """ + URLs = [self.get_url(rtid) for rtid in self.valid_ref] + name_list = self.fs.open_mfjson(URLs, preprocess=self._jsCollection) + all_tables = {} + [ + all_tables.update({rtid.split("/")[-3]: 
(name, desc, rtid)}) + for name, desc, rtid in name_list + ] + all_tables = collections.OrderedDict(sorted(all_tables.items())) + return all_tables diff --git a/argopy/related/topography.py b/argopy/related/topography.py index 39b7f4b1..dde36773 100644 --- a/argopy/related/topography.py +++ b/argopy/related/topography.py @@ -5,7 +5,7 @@ class TopoFetcher: - """ Fetch topographic data through an ERDDAP server for an ocean rectangle + """Fetch topographic data through an ERDDAP server for an ocean rectangle Example: >>> from argopy import TopoFetcher @@ -34,7 +34,7 @@ def __init__( server: Union[str] = None, **kwargs, ): - """ Instantiate an ERDDAP topo data fetcher + """Instantiate an ERDDAP topo data fetcher Parameters ---------- @@ -61,7 +61,11 @@ def __init__( self.stride = stride if ds == "gebco": self.definition = "NOAA erddap gebco data fetcher for a space region" - self.server = server if server is not None else "https://coastwatch.pfeg.noaa.gov/erddap" + self.server = ( + server + if server is not None + else "https://coastwatch.pfeg.noaa.gov/erddap" + ) self.server_name = "NOAA" self.dataset_id = "gebco" @@ -81,7 +85,7 @@ def _init_erddap(self): return self def _cname(self) -> str: - """ Fetcher one line string definition helper """ + """Fetcher one line string definition helper""" cname = "?" if hasattr(self, "BOX"): @@ -102,12 +106,12 @@ def __repr__(self): return "\n".join(summary) def cname(self): - """ Return a unique string defining the constraints """ + """Return a unique string defining the constraints""" return self._cname() @property def cachepath(self): - """ Return path to cached file(s) for this request + """Return path to cached file(s) for this request Returns ------- @@ -116,7 +120,7 @@ def cachepath(self): return [self.fs.cachepath(uri) for uri in self.uri] def define_constraints(self): - """ Define request constraints """ + """Define request constraints""" # Eg: https://coastwatch.pfeg.noaa.gov/erddap/griddap/GEBCO_2020.nc?elevation%5B(34):5:(42)%5D%5B(-21):7:(-12)%5D self.erddap.constraints = "%s(%0.2f):%i:(%0.2f)%s%s(%0.2f):%i:(%0.2f)%s" % ( "%5B", @@ -142,9 +146,9 @@ def define_constraints(self): # return vlist def url_encode(self, url): - """ Return safely encoded list of urls + """Return safely encoded list of urls - This is necessary because fsspec cannot handle in cache paths/urls with a '[' character + This is necessary because fsspec cannot handle in cache paths/urls with a '[' character """ # return urls @@ -156,7 +160,7 @@ def safe_for_fsspec_cache(url): return safe_for_fsspec_cache(url) def get_url(self): - """ Return the URL to download data requested + """Return the URL to download data requested Returns ------- @@ -181,7 +185,7 @@ def get_url(self): @property def uri(self): - """ List of files to load for a request + """List of files to load for a request Returns ------- @@ -190,7 +194,7 @@ def uri(self): return [self.get_url()] def to_xarray(self, errors: str = "ignore"): - """ Load Topographic data and return a xarray.DataSet """ + """Load Topographic data and return a xarray.DataSet""" # Download data if len(self.uri) == 1: @@ -199,5 +203,5 @@ def to_xarray(self, errors: str = "ignore"): return ds def load(self, errors: str = "ignore"): - """ Load Topographic data and return a xarray.DataSet """ + """Load Topographic data and return a xarray.DataSet""" return self.to_xarray(errors=errors) diff --git a/argopy/utilities.py b/argopy/utilities.py index fc6c8e37..831b05fb 100644 --- a/argopy/utilities.py +++ b/argopy/utilities.py @@ -2705,243 +2705,6 
@@ def get_ea_profile_page(WMO, CYC=None, **kwargs): return [url.format(this_id) for this_id in sorted(df["ID"])] -class ArgoNVSReferenceTables: - """Argo Reference Tables - - Utility function to retrieve Argo Reference Tables from a NVS server. - - By default, this relies on: https://vocab.nerc.ac.uk/collection - - Examples - -------- - Methods: - - >>> R = ArgoNVSReferenceTables() - >>> R.search('sensor') - >>> R.tbl(3) - >>> R.tbl('R09') - - Properties: - - >>> R.all_tbl_name - >>> R.all_tbl - >>> R.valid_ref - - """ - valid_ref = [ - "R01", - "RR2", - "RD2", - "RP2", - "R03", - "R04", - "R05", - "R06", - "R07", - "R08", - "R09", - "R10", - "R11", - "R12", - "R13", - "R15", - "RMC", - "RTV", - "R16", - # "R18", - "R19", - "R20", - "R21", - "R22", - "R23", - "R24", - "R25", - "R26", - "R27", - # "R28", - # "R29", - # "R30", - "R40", - ] - """List of all available Reference Tables""" - - def __init__(self, - nvs="https://vocab.nerc.ac.uk/collection", - cache: bool = True, - cachedir: str = "", - ): - """Argo Reference Tables from NVS""" - from .stores import httpstore - cachedir = OPTIONS["cachedir"] if cachedir == "" else cachedir - self.fs = httpstore(cache=cache, cachedir=cachedir) - self.nvs = nvs - - def _valid_ref(self, rtid): - if rtid not in self.valid_ref: - rtid = "R%0.2d" % rtid - if rtid not in self.valid_ref: - raise ValueError( - "Invalid Argo Reference Table, should be one in: %s" - % ", ".join(self.valid_ref) - ) - return rtid - - def _jsConcept2df(self, data): - """Return all skos:Concept as class:`pandas.DataFrame`""" - content = { - "altLabel": [], - "prefLabel": [], - "definition": [], - "deprecated": [], - "id": [], - } - for k in data["@graph"]: - if k["@type"] == "skos:Collection": - Collection_name = k["alternative"] - elif k["@type"] == "skos:Concept": - content["altLabel"].append(k["altLabel"]) - content["prefLabel"].append(k["prefLabel"]["@value"]) - content["definition"].append(k["definition"]["@value"]) - content["deprecated"].append(k["deprecated"]) - content["id"].append(k["@id"]) - df = pd.DataFrame.from_dict(content) - df.name = Collection_name - return df - - def _jsCollection(self, data): - """Return last skos:Collection information as data""" - for k in data["@graph"]: - if k["@type"] == "skos:Collection": - name = k["alternative"] - desc = k["description"] - rtid = k["@id"] - return (name, desc, rtid) - - def get_url(self, rtid, fmt="ld+json"): - """Return URL toward a given reference table for a given format - - Parameters - ---------- - rtid: {str, int} - Name or number of the reference table to retrieve. Eg: 'R01', 12 - fmt: str, default: "ld+json" - Format of the NVS server response. Can be: "ld+json", "rdf+xml" or "text/turtle". - - Returns - ------- - str - """ - rtid = self._valid_ref(rtid) - if fmt == "ld+json": - fmt_ext = "?_profile=nvs&_mediatype=application/ld+json" - elif fmt == "rdf+xml": - fmt_ext = "?_profile=nvs&_mediatype=application/rdf+xml" - elif fmt == "text/turtle": - fmt_ext = "?_profile=nvs&_mediatype=text/turtle" - else: - raise ValueError("Invalid format. Must be in: 'ld+json', 'rdf+xml' or 'text/turtle'.") - url = "{}/{}/current/{}".format - return url(self.nvs, rtid, fmt_ext) - - @lru_cache - def tbl(self, rtid): - """Return an Argo Reference table - - Parameters - ---------- - rtid: {str, int} - Name or number of the reference table to retrieve. 
Eg: 'R01', 12 - - Returns - ------- - class:`pandas.DataFrame` - """ - rtid = self._valid_ref(rtid) - js = self.fs.open_json(self.get_url(rtid)) - df = self._jsConcept2df(js) - return df - - def tbl_name(self, rtid): - """Return name of an Argo Reference table - - Parameters - ---------- - rtid: {str, int} - Name or number of the reference table to retrieve. Eg: 'R01', 12 - - Returns - ------- - tuple('short name', 'description', 'NVS id link') - """ - rtid = self._valid_ref(rtid) - js = self.fs.open_json(self.get_url(rtid)) - return self._jsCollection(js) - - def search(self, txt, where='all'): - """Search for string in tables title and/or description - - Parameters - ---------- - txt: str - where: str, default='all' - Where to search, can be: 'title', 'description', 'all' - - Returns - ------- - list of table id matching the search - """ - results = [] - for tbl_id in self.all_tbl_name: - title = self.tbl_name(tbl_id)[0] - description = self.tbl_name(tbl_id)[1] - if where == 'title': - if txt.lower() in title.lower(): - results.append(tbl_id) - elif where == 'description': - if txt.lower() in description.lower(): - results.append(tbl_id) - elif where == 'all': - if txt.lower() in description.lower() or txt.lower() in title.lower(): - results.append(tbl_id) - return results - - @property - def all_tbl(self): - """Return all Argo Reference tables - - Returns - ------- - OrderedDict - Dictionary with all table short names as key and table content as class:`pandas.DataFrame` - """ - URLs = [self.get_url(rtid) for rtid in self.valid_ref] - df_list = self.fs.open_mfjson(URLs, preprocess=self._jsConcept2df) - all_tables = {} - [all_tables.update({t.name: t}) for t in df_list] - all_tables = collections.OrderedDict(sorted(all_tables.items())) - return all_tables - - @property - def all_tbl_name(self): - """Return names of all Argo Reference tables - - Returns - ------- - OrderedDict - Dictionary with all table short names as key and table names as tuple('short name', 'description', 'NVS id link') - """ - URLs = [self.get_url(rtid) for rtid in self.valid_ref] - name_list = self.fs.open_mfjson(URLs, preprocess=self._jsCollection) - all_tables = {} - [ - all_tables.update({rtid.split("/")[-3]: (name, desc, rtid)}) - for name, desc, rtid in name_list - ] - all_tables = collections.OrderedDict(sorted(all_tables.items())) - return all_tables - - - @deprecated def cast_types(ds): # noqa: C901 """ Make sure variables are of the appropriate types according to Argo @@ -3314,352 +3077,6 @@ def log_argopy_callerstack(level='debug'): log.warning(msg) -class ArgoDocs: - """ADMT documentation helper class - - Examples - -------- - >>> ArgoDocs().list - >>> ArgoDocs().search("CDOM") - >>> ArgoDocs().search("CDOM", where='abstract') - - >>> ArgoDocs(35385) - >>> ArgoDocs(35385).ris - >>> ArgoDocs(35385).abstract - >>> ArgoDocs(35385).show() - >>> ArgoDocs(35385).open_pdf() - >>> ArgoDocs(35385).open_pdf(page=12) - - """ - _catalogue = [ - { - "category": "Argo data formats", - "title": "Argo user's manual", - "doi": "10.13155/29825", - "id": 29825 - }, - { - "category": "Quality control", - "title": "Argo Quality Control Manual for CTD and Trajectory Data", - "doi": "10.13155/33951", - "id": 33951 - }, - { - "category": "Quality control", - "title": "Argo quality control manual for dissolved oxygen concentration", - "doi": "10.13155/46542", - "id": 46542 - }, - { - "category": "Quality control", - "title": "Argo quality control manual for biogeochemical data", - "doi": "10.13155/40879", - "id": 40879 - }, - { - 
"category": "Quality control", - "title": "BGC-Argo quality control manual for the Chlorophyll-A concentration", - "doi": "10.13155/35385", - "id": 35385 - }, - { - "category": "Quality control", - "title": "BGC-Argo quality control manual for nitrate concentration", - "doi": "10.13155/84370", - "id": 84370 - }, - { - "category": "Quality control", - "title": "Quality control for BGC-Argo radiometry", - "doi": "10.13155/62466", - "id": 62466 - }, - { - "category": "Cookbooks", - "title": "Argo DAC profile cookbook", - "doi": "10.13155/41151", - "id": 41151 - }, - { - "category": "Cookbooks", - "title": "Argo DAC trajectory cookbook", - "doi": "10.13155/29824", - "id": 29824 - }, - { - "category": "Cookbooks", - "title": "DMQC Cookbook for Core Argo parameters", - "doi": "10.13155/78994", - "id": 78994 - }, - { - "category": "Cookbooks", - "title": "Processing Argo oxygen data at the DAC level", - "doi": "10.13155/39795", - "id": 39795 - }, - { - "category": "Cookbooks", - "title": "Processing Bio-Argo particle backscattering at the DAC level", - "doi": "10.13155/39459", - "id": 39459 - }, - { - "category": "Cookbooks", - "title": "Processing BGC-Argo chlorophyll-A concentration at the DAC level", - "doi": "10.13155/39468", - "id": 39468 - }, - { - "category": "Cookbooks", - "title": "Processing Argo measurement timing information at the DAC level", - "doi": "10.13155/47998", - "id": 47998 - }, - { - "category": "Cookbooks", - "title": "Processing BGC-Argo CDOM concentration at the DAC level", - "doi": "10.13155/54541", - "id": 54541 - }, - { - "category": "Cookbooks", - "title": "Processing Bio-Argo nitrate concentration at the DAC Level", - "doi": "10.13155/46121", - "id": 46121 - }, - { - "category": "Cookbooks", - "title": "Processing BGC-Argo Radiometric data at the DAC level", - "doi": "10.13155/51541", - "id": 51541 - }, - { - "category": "Cookbooks", - "title": "Processing BGC-Argo pH data at the DAC level", - "doi": "10.13155/57195", - "id": 57195 - }, - { - "category": "Cookbooks", - "title": "Description of the Argo GDAC File Checks: Data Format and Consistency Checks", - "doi": "10.13155/46120", - "id": 46120 - }, - { - "category": "Cookbooks", - "title": "Description of the Argo GDAC File Merge Process", - "doi": "10.13155/52154", - "id": 52154 - }, - { - "category": "Cookbooks", - "title": "BGC-Argo synthetic profile file processing and format on Coriolis GDAC", - "doi": "10.13155/55637", - "id": 55637 - }, - { - "category": "Cookbooks", - "title": "Argo GDAC cookbook", - "doi": "10.13155/46202", - "id": 46202 - } - ] - - class RIS: - """RIS file structure from TXT file""" - - def __init__(self, file=None, fs=None): - self.record = None - self.fs = fs - if file: - self.parse(file) - - def parse(self, file): - """Parse input file""" - # log.debug(file) - - with self.fs.open(file, 'r', encoding="utf-8") as f: - TXTlines = f.readlines() - lines = [] - # Eliminate blank lines - for line in TXTlines: - line = line.strip() - if len(line) > 0: - lines.append(line) - TXTlines = lines - - # - record = {} - for line in TXTlines: - # print("\n>", line) - if len(line) > 2: - if line[2] == " ": - tag = line[0:2] - field = line[3:] - # print("ok", {tag: field}) - record[tag] = [field] - else: - # print("-", line) - record[tag].append(line) - elif len(line) == 2: - record[line] = [] - # else: - # print("*", line) - - for key in record.keys(): - record[key] = "; ".join(record[key]) - - self.record = record - - @lru_cache - def __init__(self, docid=None, cache=False): - from .stores import 
httpstore - - self.docid = None - self._ris = None - self._risfile = None - self._fs = httpstore(cache=cache, cachedir=OPTIONS['cachedir']) - self._doiserver = "https://dx.doi.org" - self._archimer = "https://archimer.ifremer.fr" - - if isinstance(docid, int): - if docid in [doc['id'] for doc in self._catalogue]: - self.docid = docid - else: - raise ValueError("Unknown document id") - elif isinstance(docid, str): - start_with = lambda f, x: f[0:len(x)] == x if len(x) <= len(f) else False # noqa: E731 - if start_with(docid, '10.13155/') and docid in [doc['doi'] for doc in self._catalogue]: - self.docid = [doc['id'] for doc in self._catalogue if docid == doc['doi']][0] - else: - raise ValueError("'docid' must be an integer or a valid Argo DOI") - - def __repr__(self): - summary = [""] - if self.docid is not None: - doc = [doc for doc in self._catalogue if doc['id'] == self.docid][0] - summary.append("Title: %s" % doc['title']) - summary.append("DOI: %s" % doc['doi']) - summary.append("url: https://dx.doi.org/%s" % doc['doi']) - summary.append("last pdf: %s" % self.pdf) - if 'AF' in self.ris: - summary.append("Authors: %s" % self.ris['AF']) - summary.append("Abstract: %s" % self.ris['AB']) - else: - summary.append("- %i documents with a DOI are available in the catalogue" % len(self._catalogue)) - summary.append("- Use the method 'search' to find a document id") - summary.append("- Use the property 'list' to check out the catalogue") - return "\n".join(summary) - - @property - def list(self): - """List of all available documents as a :class:`pandas.DataFrame`""" - return pd.DataFrame(self._catalogue) - - @property - def js(self): - """Internal json record for a document""" - if self.docid is not None: - return [doc for doc in self._catalogue if doc['id'] == self.docid][0] - else: - raise ValueError("Select a document first !") - - @property - def ris(self): - """RIS record of a document""" - if self.docid is not None: - if self._ris is None: - # Fetch RIS metadata for this document: - import re - file = self._fs.download_url("%s/%s" % (self._doiserver, self.js['doi'])) - x = re.search(r']*)rel="nofollow">TXT<\/a>', - str(file)) - export_txt_url = x[1].replace("https://archimer.ifremer.fr", self._archimer) - self._risfile = export_txt_url - self._ris = self.RIS(export_txt_url, fs=self._fs).record - return self._ris - else: - raise ValueError("Select a document first !") - - @property - def abstract(self): - """Abstract of a document""" - if self.docid is not None: - return self.ris['AB'] - else: - raise ValueError("Select a document first !") - - @property - def pdf(self): - """Link to the online pdf version of a document""" - if self.docid is not None: - return self.ris['UR'] - else: - raise ValueError("Select a document first !") - - def show(self, height=800): - """Insert document in pdf in a notebook cell - - Parameters - ---------- - height: int - Height in pixels of the cell - """ - if self.docid is not None: - from IPython.core.display import HTML - return HTML( - '' % (self.ris['UR'], height)) - else: - raise ValueError("Select a document first !") - - def open_pdf(self, page=None, url_only=False): - """Open document in new browser tab - - Parameters - ---------- - page: int, optional - Open directly a specific page number - """ - url = self.pdf - url += '#view=FitV&pagemode=thumbs' - if page: - url += '&page=%i' % page - if self.docid is not None: - if not url_only: - import webbrowser - webbrowser.open_new(url) - else: - return url - else: - raise ValueError("Select a document first 
!") - - def search(self, txt, where='title'): - """Search for string in all documents title or abstract - - Parameters - ---------- - txt: str - where: str, default='title' - Where to search, can be 'title' or 'abstract' - - Returns - ------- - list - - """ - results = [] - for doc in self.list.iterrows(): - docid = doc[1]['id'] - if where == 'title': - if txt.lower() in ArgoDocs(docid).js['title'].lower(): - results.append(docid) - elif where == 'abstract': - if txt.lower() in ArgoDocs(docid).abstract.lower(): - results.append(docid) - return results - - def drop_variables_not_in_all_datasets(ds_collection): """Drop variables that are not in all datasets (the lowest common denominator) From 3db2954dccc4576e127f8079563a6421b3c6ba00 Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Wed, 6 Sep 2023 16:27:30 +0200 Subject: [PATCH 05/33] Update __init__.py --- argopy/__init__.py | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/argopy/__init__.py b/argopy/__init__.py index 8f2c8392..72602786 100644 --- a/argopy/__init__.py +++ b/argopy/__init__.py @@ -35,13 +35,12 @@ from . import plot # noqa: E402 from .plot import dashboard, ArgoColors # noqa: E402 from .utilities import show_versions, show_options, clear_cache, lscache # noqa: E402 -from .utilities import ArgoDocs # noqa: E402 from .utilities import monitor_status as status # noqa: E402 from .options import set_options, reset_options # noqa: E402 from .data_fetchers import CTDRefDataFetcher # noqa: E402 from .stores import ArgoIndex # noqa: E402 from .utils import compute # noqa: E402, F401 -from .related import TopoFetcher, OceanOPSDeployments, ArgoNVSReferenceTables # noqa: E402 +from .related import TopoFetcher, OceanOPSDeployments, ArgoNVSReferenceTables, ArgoDocs # noqa: E402 # __all__ = ( @@ -73,7 +72,6 @@ "errors", "plot", "ArgoColors", # Class - # "plotters", # Deprec, to be removed after 0.1.13 "stores", "tutorial", # Constants From b64fabe2ecc2c957cd5fb3400450baf265d9f9ec Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Wed, 6 Sep 2023 16:27:50 +0200 Subject: [PATCH 06/33] refactor tests locations --- argopy/tests/test_related.py | 303 +++++++++++++++++++++++++++++++++ argopy/tests/test_utilities.py | 287 ------------------------------- 2 files changed, 303 insertions(+), 287 deletions(-) create mode 100644 argopy/tests/test_related.py diff --git a/argopy/tests/test_related.py b/argopy/tests/test_related.py new file mode 100644 index 00000000..82f2028c --- /dev/null +++ b/argopy/tests/test_related.py @@ -0,0 +1,303 @@ +import pytest +import tempfile +import xarray as xr +import pandas as pd +from collections import ChainMap, OrderedDict +import shutil + +from mocked_http import mocked_httpserver, mocked_server_address +from utils import ( + requires_matplotlib, + requires_cartopy, + requires_oops, + has_matplotlib, + has_cartopy, + has_ipython, +) +from argopy.related import ( + TopoFetcher, + ArgoNVSReferenceTables, + OceanOPSDeployments, + ArgoDocs, +) +from argopy.utilities import ( + is_list_of_strings, +) + +if has_matplotlib: + import matplotlib as mpl + +if has_cartopy: + import cartopy + +if has_ipython: + import IPython + + +class Test_TopoFetcher(): + box = [81, 123, -67, -54] + + def setup_class(self): + """setup any state specific to the execution of the given class""" + # Create the cache folder here, so that it's not the same for the pandas and pyarrow tests + self.cachedir = tempfile.mkdtemp() + + def teardown_class(self): + """Cleanup once we are finished.""" + def remove_test_dir(): + 
shutil.rmtree(self.cachedir) + remove_test_dir() + + def make_a_fetcher(self, cached=False): + opts = {'ds': 'gebco', 'stride': [10, 10], 'server': mocked_server_address} + if cached: + opts = ChainMap(opts, {'cache': True, 'cachedir': self.cachedir}) + return TopoFetcher(self.box, **opts) + + def assert_fetcher(self, f): + ds = f.to_xarray() + assert isinstance(ds, xr.Dataset) + assert 'elevation' in ds.data_vars + + def test_load_mocked_server(self, mocked_httpserver): + """This will easily ensure that the module scope fixture is available to all methods !""" + assert True + + params = [True, False] + ids_params = ["cached=%s" % p for p in params] + @pytest.mark.parametrize("params", params, indirect=False, ids=ids_params) + def test_fetching(self, params): + fetcher = self.make_a_fetcher(cached=params) + self.assert_fetcher(fetcher) + + +class Test_ArgoNVSReferenceTables: + + def setup_class(self): + """setup any state specific to the execution of the given class""" + # Create the cache folder here, so that it's not the same for the pandas and pyarrow tests + self.cachedir = tempfile.mkdtemp() + self.nvs = ArgoNVSReferenceTables(cache=True, cachedir=self.cachedir, nvs=mocked_server_address) + + def teardown_class(self): + """Cleanup once we are finished.""" + def remove_test_dir(): + shutil.rmtree(self.cachedir) + remove_test_dir() + + def test_load_mocked_server(self, mocked_httpserver): + """This will easily ensure that the module scope fixture is available to all methods !""" + assert True + + def test_valid_ref(self): + assert is_list_of_strings(self.nvs.valid_ref) + + opts = [3, 'R09'] + opts_ids = ["rtid is a %s" % type(o) for o in opts] + @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids) + def test_tbl(self, opts): + assert isinstance(self.nvs.tbl(opts), pd.DataFrame) + + opts = [3, 'R09'] + opts_ids = ["rtid is a %s" % type(o) for o in opts] + @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids) + def test_tbl_name(self, opts): + names = self.nvs.tbl_name(opts) + assert isinstance(names, tuple) + assert isinstance(names[0], str) + assert isinstance(names[1], str) + assert isinstance(names[2], str) + + def test_all_tbl(self): + all = self.nvs.all_tbl + assert isinstance(all, OrderedDict) + assert isinstance(all[list(all.keys())[0]], pd.DataFrame) + + def test_all_tbl_name(self): + all = self.nvs.all_tbl_name + assert isinstance(all, OrderedDict) + assert isinstance(all[list(all.keys())[0]], tuple) + + opts = ["ld+json", "rdf+xml", "text/turtle", "invalid"] + opts_ids = ["fmt=%s" % o for o in opts] + @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids) + def test_get_url(self, opts): + if opts != 'invalid': + url = self.nvs.get_url(3, fmt=opts) + assert isinstance(url, str) + if "json" in opts: + data = self.nvs.fs.open_json(url) + assert isinstance(data, dict) + elif "xml" in opts: + data = self.nvs.fs.fs.cat_file(url) + assert data[0:5] == b' Date: Wed, 6 Sep 2023 16:31:32 +0200 Subject: [PATCH 07/33] Update api-hidden.rst --- docs/api-hidden.rst | 60 ++++++++++++++++++++++----------------------- 1 file changed, 30 insertions(+), 30 deletions(-) diff --git a/docs/api-hidden.rst b/docs/api-hidden.rst index c7c307da..ff4e968d 100644 --- a/docs/api-hidden.rst +++ b/docs/api-hidden.rst @@ -69,25 +69,9 @@ argopy.utilities.isalive argopy.utilities.isAPIconnected - argopy.utilities.ArgoNVSReferenceTables - argopy.utilities.ArgoNVSReferenceTables.search - argopy.utilities.ArgoNVSReferenceTables.valid_ref - 
argopy.utilities.ArgoNVSReferenceTables.all_tbl - argopy.utilities.ArgoNVSReferenceTables.all_tbl_name - argopy.utilities.ArgoNVSReferenceTables.tbl - argopy.utilities.ArgoNVSReferenceTables.tbl_name - argopy.utilities.groupby_remap argopy.utilities.linear_interpolation_remap - argopy.utilities.TopoFetcher.cname - argopy.utilities.TopoFetcher.define_constraints - argopy.utilities.TopoFetcher.get_url - argopy.utilities.TopoFetcher.load - argopy.utilities.TopoFetcher.to_xarray - argopy.utilities.TopoFetcher.cachepath - argopy.utilities.TopoFetcher.uri - argopy.utilities.list_standard_variables argopy.utilities.list_multiprofile_file_variables argopy.utilities.load_dict @@ -105,25 +89,41 @@ argopy.utilities.get_coriolis_profile_id argopy.utilities.get_ea_profile_page - argopy.utilities.OceanOPSDeployments - argopy.utilities.OceanOPSDeployments.to_dataframe - argopy.utilities.OceanOPSDeployments.status_code - - argopy.utilities.ArgoDocs - argopy.utilities.ArgoDocs.list - argopy.utilities.ArgoDocs.search - argopy.utilities.ArgoDocs.ris - argopy.utilities.ArgoDocs.abstract - argopy.utilities.ArgoDocs.pdf - argopy.utilities.ArgoDocs.open_pdf - argopy.utilities.ArgoDocs.show - argopy.utilities.ArgoDocs.js - argopy.utilities.drop_variables_not_in_all_datasets argopy.utilities.fill_variables_not_in_all_datasets argopy.utils.compute.MyThreadPoolExecutor + argopy.related.TopoFetcher.cname + argopy.related.TopoFetcher.define_constraints + argopy.related.TopoFetcher.get_url + argopy.related.TopoFetcher.load + argopy.related.TopoFetcher.to_xarray + argopy.related.TopoFetcher.cachepath + argopy.related.TopoFetcher.uri + + argopy.related.ArgoNVSReferenceTables + argopy.related.ArgoNVSReferenceTables.search + argopy.related.ArgoNVSReferenceTables.valid_ref + argopy.related.ArgoNVSReferenceTables.all_tbl + argopy.related.ArgoNVSReferenceTables.all_tbl_name + argopy.related.ArgoNVSReferenceTables.tbl + argopy.related.ArgoNVSReferenceTables.tbl_name + + argopy.related.OceanOPSDeployments + argopy.related.OceanOPSDeployments.to_dataframe + argopy.related.OceanOPSDeployments.status_code + + argopy.related.ArgoDocs + argopy.related.ArgoDocs.list + argopy.related.ArgoDocs.search + argopy.related.ArgoDocs.ris + argopy.related.ArgoDocs.abstract + argopy.related.ArgoDocs.pdf + argopy.related.ArgoDocs.open_pdf + argopy.related.ArgoDocs.show + argopy.related.ArgoDocs.js + argopy.plot argopy.plot.dashboard From ec22c17fc809bdeb3475eb4f6f06cdf0d77a3999 Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Wed, 6 Sep 2023 16:37:19 +0200 Subject: [PATCH 08/33] update MyThreadPoolExecutor access [skip-ci] --- argopy/__init__.py | 2 +- argopy/stores/filesystems.py | 2 +- argopy/utils/__init__.py | 7 +++++++ argopy/utils/{compute.py => monitored_threadpool.py} | 6 +++--- docs/api-hidden.rst | 2 +- 5 files changed, 13 insertions(+), 6 deletions(-) rename argopy/utils/{compute.py => monitored_threadpool.py} (99%) diff --git a/argopy/__init__.py b/argopy/__init__.py index 72602786..58a9fe29 100644 --- a/argopy/__init__.py +++ b/argopy/__init__.py @@ -39,7 +39,7 @@ from .options import set_options, reset_options # noqa: E402 from .data_fetchers import CTDRefDataFetcher # noqa: E402 from .stores import ArgoIndex # noqa: E402 -from .utils import compute # noqa: E402, F401 +from .utils import monitored_threadpool # noqa: E402, F401 from .related import TopoFetcher, OceanOPSDeployments, ArgoNVSReferenceTables, ArgoDocs # noqa: E402 # diff --git a/argopy/stores/filesystems.py b/argopy/stores/filesystems.py index b37aedd9..aede839b 
100644 --- a/argopy/stores/filesystems.py +++ b/argopy/stores/filesystems.py @@ -54,7 +54,7 @@ drop_variables_not_in_all_datasets, fill_variables_not_in_all_datasets, ) -from ..utils.compute import MyThreadPoolExecutor as MyExecutor +from ..utils import MyThreadPoolExecutor as MyExecutor log = logging.getLogger("argopy.stores") diff --git a/argopy/utils/__init__.py b/argopy/utils/__init__.py index e69de29b..c93ca7db 100644 --- a/argopy/utils/__init__.py +++ b/argopy/utils/__init__.py @@ -0,0 +1,7 @@ +from .monitored_threadpool import MyThreadPoolExecutor + + +__all__ = ( + # Classes: + "MyThreadPoolExecutor", +) diff --git a/argopy/utils/compute.py b/argopy/utils/monitored_threadpool.py similarity index 99% rename from argopy/utils/compute.py rename to argopy/utils/monitored_threadpool.py index 5b4a0385..5b637230 100644 --- a/argopy/utils/compute.py +++ b/argopy/utils/monitored_threadpool.py @@ -1,5 +1,5 @@ """ -This sub-module provides utilities for miscellaneous computation tasks +This sub-module provides utilities for miscellaneous computation tasks with multitheading We construct the MyThreadPoolExecutor class, we create a series of classes using multiple inheritance to implement monitoring features @@ -527,13 +527,13 @@ class c(proto_MonitoredPoolExecutor_terminal): class MyThreadPoolExecutor(c): """ - This is a low-level helper class not intended to be used directly. + This is a low-level helper class not intended to be used directly by users Examples -------- :: - from argopy.utils.compute import MyThreadPoolExecutor as MyExecutor + from argopy.utils import MyThreadPoolExecutor as MyExecutor from random import random from time import sleep import numpy as np diff --git a/docs/api-hidden.rst b/docs/api-hidden.rst index ff4e968d..67b13130 100644 --- a/docs/api-hidden.rst +++ b/docs/api-hidden.rst @@ -92,7 +92,7 @@ argopy.utilities.drop_variables_not_in_all_datasets argopy.utilities.fill_variables_not_in_all_datasets - argopy.utils.compute.MyThreadPoolExecutor + argopy.utils.MyThreadPoolExecutor argopy.related.TopoFetcher.cname argopy.related.TopoFetcher.define_constraints From 44025d2e49bc3b6472356883ecd95e2cd86ecdbc Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Thu, 7 Sep 2023 08:30:35 +0200 Subject: [PATCH 09/33] Update __init__.py --- argopy/related/__init__.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/argopy/related/__init__.py b/argopy/related/__init__.py index 87520fa9..84c62f22 100644 --- a/argopy/related/__init__.py +++ b/argopy/related/__init__.py @@ -2,7 +2,7 @@ from .ocean_ops_deployments import OceanOPSDeployments from .reference_tables import ArgoNVSReferenceTables from .argo_documentation import ArgoDocs -from .gdac_snapshot import ArgoDOI +from .doi_snapshot import ArgoDOI # From 6891cbd9acd767e2341d57031fda0340163efcf5 Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Thu, 7 Sep 2023 08:30:42 +0200 Subject: [PATCH 10/33] Delete gdac_snapshot.py --- argopy/related/gdac_snapshot.py | 389 -------------------------------- 1 file changed, 389 deletions(-) delete mode 100644 argopy/related/gdac_snapshot.py diff --git a/argopy/related/gdac_snapshot.py b/argopy/related/gdac_snapshot.py deleted file mode 100644 index 6c46b417..00000000 --- a/argopy/related/gdac_snapshot.py +++ /dev/null @@ -1,389 +0,0 @@ -import pandas as pd -import numpy as np -import warnings -from typing import Union - -# from matplotlib.colors import to_hex -# from IPython.display import IFrame - -from ..stores import httpstore - - -class DOIrecord: - """Helper class for an 
Argo GDAC snapshot DOI record - - Examples - -------- - d = DOIrecord() - d = DOIrecord('42182') - d = DOIrecord('42182#103075') - d = DOIrecord(hashtag='103075') - d = DOIrecord(hashtag='103088') - - d.doi - d.dx - d.isvalid - d.date - d.network - d.data - d.file - - """ - root = "" - - def __init__( - self, - doi: str = "10.17882/42182", - hashtag: str = None, - fs: httpstore = None, - autoload: bool = True, - api_root: str = "https://www.seanoe.org/api/", - ): - self.api_root = api_root - self._fs = fs # A httpstore will be created if necessary if self.load() is called - self._data = None - - self._doi = doi - self._hashtag = hashtag - if "#" in doi: - self._doi = doi.split("#")[0] - self._hashtag = doi.split("#")[-1] - - if autoload: - self.load() - - @property - def doi(self) -> str: - """DOI component (without hashtag)""" - return self._doi - - @property - def hashtag(self) -> str: - """Hashtag of the full doi""" - return self._hashtag - - @property - def dx(self) -> str: - """DOI url""" - return "https:/dx.doi.org/%s" % str(self) - - def isvalid(self) -> bool: - return "42182" in self.doi - - @property - def data(self) -> dict: - """ "Internal DOI record data - - Trigger data (down)load if not available - """ - if self._data is None: - self.load() - return self._data - - @property - def date(self) -> pd.Timestamp: - """Date associated with the DOI record""" - return self.data["date"] - - @property - def network(self) -> str: - """Network of the Argo data pointed by the DOI - - Returns - ------- - str: 'core+BGC+deep' or 'BGC' - """ - return "BGC" if "BGC" in self.data["title"] else "core+BGC+deep" - - @property - def file(self) -> list: - """Return a pretty list of files properties associated with this DOI""" - results = [] - for f in self.data["files"]: - r = {"openAccess": bool(f["openAccess"])} - if bool(f["openAccess"]): - r["path"] = f["fileUrl"] - else: - r["path"] = None - r["update"] = pd.to_datetime(f["lastUpdateDate"]) - r["date"] = pd.to_datetime(f["fragment"]["date"]) - r["size"] = f["size"] - r["network"] = "BGC" if "BGC" in f["fragment"]["title"] else "core+BGC+deep" - results.append(r) - return results - - @property - def uri(self) -> str: - """url to API call to retrieve DOI data""" - if self.hashtag is None: - url = "find-by-id/{id}".format - else: - url = "find-by-fragment/{id}?fragmentId={hashtag}".format - return self.api_root + url(id=self.doi.split("/")[-1], hashtag=self.hashtag) - - def __str__(self): - # txt = "%s/%s" % (self.root, self.doi) - txt = "%s" % (self.doi) - if self.hashtag is not None: - txt = "%s#%s" % (txt, self._hashtag) - return txt - - def _process_data(self, data: dict) -> dict: - """Synthetic dict from data return by API""" - Nfiles = len(data["files"]) - if Nfiles > 1: - # Sort files resources by date (most recent first) - data["files"].sort( - key=lambda x: x.get("fragment").get("date"), reverse=True - ) - - return { - "title": data["title"]["en"], - "date": pd.to_datetime(data["date"]), - "authors": data["authors"], - "files": data["files"], - "Nfiles": Nfiles, - # 'description': data['description'], - # 'keywords': data['keywords'], - # 'licenceUrl': data['licenceUrl'], - } - - def load(self, cache: bool = False): - """Load DOI record data from API call""" - if self._data is None: - if self._fs is None: - self._fs = httpstore(cache=cache) - - data = self._fs.open_json(self.uri) - self._data = self._process_data(data) - - return self - - def from_dict(self, d: dict): - """Load DOI record data from a dictionary""" - if ( - "title" in d - 
and "en" in d["title"] - and "date" in d - and "authors" in d - and "files" in d - ): - self._data = self._process_data(d) - return self - - def search(self, **kwargs): - raise ValueError("") - - def _repr_file(self, file, with_label=False) -> str: - """Return a pretty string from a single file dict""" - def sizeof_fmt(num, suffix="B"): - for unit in ("", "Ki", "Mi", "Gi", "Ti", "Pi", "Ei", "Zi"): - if abs(num) < 1024.0: - return f"{num:3.1f}{unit}{suffix}" - num /= 1024.0 - return f"{num:.1f}Yi{suffix}" - - summary = [] - if with_label: - summary.append("%s" % file["label"]["en"]) - - if bool(file["openAccess"]): - summary.append("%s" % file["fileUrl"]) - else: - summary.append("%s" % file["fileName"]) - - attrs = [] - attrs.append("%s" % sizeof_fmt(file["size"])) - attrs.append("openAccess=%s" % file["openAccess"]) - summary.append("(%s)" % (", ".join(attrs))) - - return " ".join(summary) - - def __repr__(self): - summary = [""] - summary.append("DOI: %s" % self.__str__()) - if self._data is not None: - summary.append("Title: %s" % self.data["title"]) - summary.append("Date: %s" % self.date.strftime("%Y-%m-%d")) - summary.append("Network: %s" % self.network) - - if self.data["Nfiles"] == 1: - summary.append("File: %s" % self._repr_file(self.data["files"][0])) - else: - summary.append("File: %i files in total" % (self.data["Nfiles"])) - - summary.append("Files for core+BGC+deep:") - ifound = 0 - for ii, f in enumerate(self.data["files"]): - if "BGC" not in f["fragment"]["title"] and ifound < 10: - summary.append( - " - #%s %s" - % (f["id"], self._repr_file(f, with_label=True)) - ) - ifound += 1 - - summary.append("Files for BGC only:") - ifound = 0 - for ii, f in enumerate(self.data["files"]): - if "BGC" in f["fragment"]["title"] and ifound < 10: - summary.append( - " - #%s %s" - % (f["id"], self._repr_file(f, with_label=True)) - ) - ifound += 1 - - return "\n".join(summary) - - # @property - # def html(self) -> str: - # fs = 12 - # - # def td_msg(bgcolor, txtcolor, txt): - # style = "background-color:%s;" % to_hex(bgcolor, keep_alpha=True) - # style += "border-width:0px;" - # style += "padding: 2px 2px 2px 0px;" - # style += "text-align:left;" - # style += "color:%s" % to_hex(txtcolor, keep_alpha=True) - # return "%s" % (style, str(txt)) - # - # def td_a(bgcolor, txtcolor, txt, link): - # style = "background-color:%s;" % to_hex(bgcolor, keep_alpha=True) - # style += "border-width:0px;" - # style += "padding: 2px 0px 2px 5px;" - # style += "text-align:right;" - # style += "color:%s" % to_hex(txtcolor, keep_alpha=True) - # return "%s" % (style, link, str(txt)) - # - # td_empty = " " - # - # html = [] - # html.append( - # "" - # % fs - # ) - # html.append("") - # - # rows = [] - # - # # 1st row: - # cols = [] - # cols.append(td_msg("dimgray", "w", "doi: ")) - # cols.append(td_msg("green", "w", "%s/" % self.root)) - # cols.append(td_msg("yellowgreen", "w", self.doi)) - # if self.hashtag is not None: - # cols.append(td_msg("darkorange", "w", "#%s" % self.hashtag)) - # cols.append(td_a("white", "w", "↗", self.dx)) - # cols.append(td_empty) - # rows.append("%s" % "\n".join(cols)) - # - # # # 2nd row (if data have been loaded): - # # if self._data is not None: - # # cols = [] - # # cols.append(td_msg('dimgray', 'w', "Title: ")) - # # cols.append(td_msg('white', 'w', "%s" % self.data['title'])) - # # # cols.append(td_msg('yellowgreen', 'w', self.doi)) - # # # if self.hashtag is not None: - # # # cols.append(td_msg("darkorange", 'w', "#%s" % self.hashtag)) - # # # cols.append(td_a("white", 'w', 
"↗", self.dx)) - # # # cols.append(td_empty) - # # rows.append("%s" % "\n".join(cols)) - # - # # print(rows) - # # # Fix colspan: - # # Nrows = np.max([len(r.split("" % Nrows)) - # # print(rowss) - # - # # Finalize - # html.append("\n".join(rows)) - # html.append("") - # html.append("
", "
") - # html = "\n".join(html) - # return html - - # def _repr_html_(self): - # return self.html - - -class ArgoDOI: - """Helper class for Argo GDAC snapshot DOI access and discovery - - Examples - -------- - from argopy import ArgoDOI - - doi = ArgoDOI() # If you don't know where to start, just load the primary Argo DOI record - doi = ArgoDOI('95141') # To point directly to a snapshot ID - doi = ArgoDOI(hashtag='95141') - doi = ArgoDOI(fs=httpstore(cache=True)) - - doi.search('2020-02') # Return doi closest to a given date - doi.search('2020-02', network='BGC') # Return doi closest to a given date for a specific network - - doi.file # Easy to read list of file(s) associated with a DOI record - doi.dx # http link toward DOI - - """ - - def __init__(self, - hashtag=None, - fs=None, - cache=True): - self._fs = fs if isinstance(fs, httpstore) else httpstore(cache=cache) - if hashtag is not None and '42182#' in hashtag: - hashtag = hashtag.split('42182#')[-1] - self._doi = DOIrecord(hashtag=hashtag, fs=self._fs, autoload=True) - - @property - def doi(self) -> str: - """DOI component (without hashtag)""" - return str(self._doi) - - def __repr__(self): - return self._doi.__repr__() - - def dates(self, network: str = None) -> dict: - d = {} - if network == "BGC": - for f in self._doi.data["files"]: - if "BGC" in f["fragment"]["title"]: - d.update({int(f["id"]): pd.to_datetime(f["fragment"]["date"])}) - else: - for f in self._doi.data["files"]: - if "BGC" not in f["fragment"]["title"]: - d.update({int(f["id"]): pd.to_datetime(f["fragment"]["date"])}) - return d - - def search(self, date: Union[str, pd.Timestamp], network: str = None) -> DOIrecord: - """Search DOI closest to a given date""" - dates = self.dates(network=network) - target = pd.to_datetime(date, utc=True) - close = list(dates.values())[ - np.argmin(np.abs([target - dates[d] for d in dates])) - ] - found = [d for d in dates if dates[d] == close] - results = [] - if len(found) > 0: - for f in found: - results.append(DOIrecord(hashtag=f, fs=self._fs)) - if len(results) == 1: - if (close - target).days > 30: - warnings.warn( - "This snapshot is more than 30 days off your search dates !" 
- ) - return results[0] - else: - return results - - @property - def file(self) -> list: - """Return a pretty list of files properties associated with this DOI""" - return self._doi.file - - @property - def dx(self) -> str: - """DOI url""" - return self._doi.dx From 8723078dbbf7dbceb6d78bfe1585c4ef6290043a Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Thu, 7 Sep 2023 08:30:48 +0200 Subject: [PATCH 11/33] Create doi_snapshot.py --- argopy/related/doi_snapshot.py | 389 +++++++++++++++++++++++++++++++++ 1 file changed, 389 insertions(+) create mode 100644 argopy/related/doi_snapshot.py diff --git a/argopy/related/doi_snapshot.py b/argopy/related/doi_snapshot.py new file mode 100644 index 00000000..6c46b417 --- /dev/null +++ b/argopy/related/doi_snapshot.py @@ -0,0 +1,389 @@ +import pandas as pd +import numpy as np +import warnings +from typing import Union + +# from matplotlib.colors import to_hex +# from IPython.display import IFrame + +from ..stores import httpstore + + +class DOIrecord: + """Helper class for an Argo GDAC snapshot DOI record + + Examples + -------- + d = DOIrecord() + d = DOIrecord('42182') + d = DOIrecord('42182#103075') + d = DOIrecord(hashtag='103075') + d = DOIrecord(hashtag='103088') + + d.doi + d.dx + d.isvalid + d.date + d.network + d.data + d.file + + """ + root = "" + + def __init__( + self, + doi: str = "10.17882/42182", + hashtag: str = None, + fs: httpstore = None, + autoload: bool = True, + api_root: str = "https://www.seanoe.org/api/", + ): + self.api_root = api_root + self._fs = fs # A httpstore will be created if necessary if self.load() is called + self._data = None + + self._doi = doi + self._hashtag = hashtag + if "#" in doi: + self._doi = doi.split("#")[0] + self._hashtag = doi.split("#")[-1] + + if autoload: + self.load() + + @property + def doi(self) -> str: + """DOI component (without hashtag)""" + return self._doi + + @property + def hashtag(self) -> str: + """Hashtag of the full doi""" + return self._hashtag + + @property + def dx(self) -> str: + """DOI url""" + return "https:/dx.doi.org/%s" % str(self) + + def isvalid(self) -> bool: + return "42182" in self.doi + + @property + def data(self) -> dict: + """ "Internal DOI record data + + Trigger data (down)load if not available + """ + if self._data is None: + self.load() + return self._data + + @property + def date(self) -> pd.Timestamp: + """Date associated with the DOI record""" + return self.data["date"] + + @property + def network(self) -> str: + """Network of the Argo data pointed by the DOI + + Returns + ------- + str: 'core+BGC+deep' or 'BGC' + """ + return "BGC" if "BGC" in self.data["title"] else "core+BGC+deep" + + @property + def file(self) -> list: + """Return a pretty list of files properties associated with this DOI""" + results = [] + for f in self.data["files"]: + r = {"openAccess": bool(f["openAccess"])} + if bool(f["openAccess"]): + r["path"] = f["fileUrl"] + else: + r["path"] = None + r["update"] = pd.to_datetime(f["lastUpdateDate"]) + r["date"] = pd.to_datetime(f["fragment"]["date"]) + r["size"] = f["size"] + r["network"] = "BGC" if "BGC" in f["fragment"]["title"] else "core+BGC+deep" + results.append(r) + return results + + @property + def uri(self) -> str: + """url to API call to retrieve DOI data""" + if self.hashtag is None: + url = "find-by-id/{id}".format + else: + url = "find-by-fragment/{id}?fragmentId={hashtag}".format + return self.api_root + url(id=self.doi.split("/")[-1], hashtag=self.hashtag) + + def __str__(self): + # txt = "%s/%s" % (self.root, self.doi) + 
txt = "%s" % (self.doi) + if self.hashtag is not None: + txt = "%s#%s" % (txt, self._hashtag) + return txt + + def _process_data(self, data: dict) -> dict: + """Synthetic dict from data return by API""" + Nfiles = len(data["files"]) + if Nfiles > 1: + # Sort files resources by date (most recent first) + data["files"].sort( + key=lambda x: x.get("fragment").get("date"), reverse=True + ) + + return { + "title": data["title"]["en"], + "date": pd.to_datetime(data["date"]), + "authors": data["authors"], + "files": data["files"], + "Nfiles": Nfiles, + # 'description': data['description'], + # 'keywords': data['keywords'], + # 'licenceUrl': data['licenceUrl'], + } + + def load(self, cache: bool = False): + """Load DOI record data from API call""" + if self._data is None: + if self._fs is None: + self._fs = httpstore(cache=cache) + + data = self._fs.open_json(self.uri) + self._data = self._process_data(data) + + return self + + def from_dict(self, d: dict): + """Load DOI record data from a dictionary""" + if ( + "title" in d + and "en" in d["title"] + and "date" in d + and "authors" in d + and "files" in d + ): + self._data = self._process_data(d) + return self + + def search(self, **kwargs): + raise ValueError("") + + def _repr_file(self, file, with_label=False) -> str: + """Return a pretty string from a single file dict""" + def sizeof_fmt(num, suffix="B"): + for unit in ("", "Ki", "Mi", "Gi", "Ti", "Pi", "Ei", "Zi"): + if abs(num) < 1024.0: + return f"{num:3.1f}{unit}{suffix}" + num /= 1024.0 + return f"{num:.1f}Yi{suffix}" + + summary = [] + if with_label: + summary.append("%s" % file["label"]["en"]) + + if bool(file["openAccess"]): + summary.append("%s" % file["fileUrl"]) + else: + summary.append("%s" % file["fileName"]) + + attrs = [] + attrs.append("%s" % sizeof_fmt(file["size"])) + attrs.append("openAccess=%s" % file["openAccess"]) + summary.append("(%s)" % (", ".join(attrs))) + + return " ".join(summary) + + def __repr__(self): + summary = [""] + summary.append("DOI: %s" % self.__str__()) + if self._data is not None: + summary.append("Title: %s" % self.data["title"]) + summary.append("Date: %s" % self.date.strftime("%Y-%m-%d")) + summary.append("Network: %s" % self.network) + + if self.data["Nfiles"] == 1: + summary.append("File: %s" % self._repr_file(self.data["files"][0])) + else: + summary.append("File: %i files in total" % (self.data["Nfiles"])) + + summary.append("Files for core+BGC+deep:") + ifound = 0 + for ii, f in enumerate(self.data["files"]): + if "BGC" not in f["fragment"]["title"] and ifound < 10: + summary.append( + " - #%s %s" + % (f["id"], self._repr_file(f, with_label=True)) + ) + ifound += 1 + + summary.append("Files for BGC only:") + ifound = 0 + for ii, f in enumerate(self.data["files"]): + if "BGC" in f["fragment"]["title"] and ifound < 10: + summary.append( + " - #%s %s" + % (f["id"], self._repr_file(f, with_label=True)) + ) + ifound += 1 + + return "\n".join(summary) + + # @property + # def html(self) -> str: + # fs = 12 + # + # def td_msg(bgcolor, txtcolor, txt): + # style = "background-color:%s;" % to_hex(bgcolor, keep_alpha=True) + # style += "border-width:0px;" + # style += "padding: 2px 2px 2px 0px;" + # style += "text-align:left;" + # style += "color:%s" % to_hex(txtcolor, keep_alpha=True) + # return "%s" % (style, str(txt)) + # + # def td_a(bgcolor, txtcolor, txt, link): + # style = "background-color:%s;" % to_hex(bgcolor, keep_alpha=True) + # style += "border-width:0px;" + # style += "padding: 2px 0px 2px 5px;" + # style += "text-align:right;" + # style += 
"color:%s" % to_hex(txtcolor, keep_alpha=True) + # return "%s" % (style, link, str(txt)) + # + # td_empty = " " + # + # html = [] + # html.append( + # "" + # % fs + # ) + # html.append("") + # + # rows = [] + # + # # 1st row: + # cols = [] + # cols.append(td_msg("dimgray", "w", "doi: ")) + # cols.append(td_msg("green", "w", "%s/" % self.root)) + # cols.append(td_msg("yellowgreen", "w", self.doi)) + # if self.hashtag is not None: + # cols.append(td_msg("darkorange", "w", "#%s" % self.hashtag)) + # cols.append(td_a("white", "w", "↗", self.dx)) + # cols.append(td_empty) + # rows.append("%s" % "\n".join(cols)) + # + # # # 2nd row (if data have been loaded): + # # if self._data is not None: + # # cols = [] + # # cols.append(td_msg('dimgray', 'w', "Title: ")) + # # cols.append(td_msg('white', 'w', "%s" % self.data['title'])) + # # # cols.append(td_msg('yellowgreen', 'w', self.doi)) + # # # if self.hashtag is not None: + # # # cols.append(td_msg("darkorange", 'w', "#%s" % self.hashtag)) + # # # cols.append(td_a("white", 'w', "↗", self.dx)) + # # # cols.append(td_empty) + # # rows.append("%s" % "\n".join(cols)) + # + # # print(rows) + # # # Fix colspan: + # # Nrows = np.max([len(r.split("" % Nrows)) + # # print(rowss) + # + # # Finalize + # html.append("\n".join(rows)) + # html.append("") + # html.append("
", "
") + # html = "\n".join(html) + # return html + + # def _repr_html_(self): + # return self.html + + +class ArgoDOI: + """Helper class for Argo GDAC snapshot DOI access and discovery + + Examples + -------- + from argopy import ArgoDOI + + doi = ArgoDOI() # If you don't know where to start, just load the primary Argo DOI record + doi = ArgoDOI('95141') # To point directly to a snapshot ID + doi = ArgoDOI(hashtag='95141') + doi = ArgoDOI(fs=httpstore(cache=True)) + + doi.search('2020-02') # Return doi closest to a given date + doi.search('2020-02', network='BGC') # Return doi closest to a given date for a specific network + + doi.file # Easy to read list of file(s) associated with a DOI record + doi.dx # http link toward DOI + + """ + + def __init__(self, + hashtag=None, + fs=None, + cache=True): + self._fs = fs if isinstance(fs, httpstore) else httpstore(cache=cache) + if hashtag is not None and '42182#' in hashtag: + hashtag = hashtag.split('42182#')[-1] + self._doi = DOIrecord(hashtag=hashtag, fs=self._fs, autoload=True) + + @property + def doi(self) -> str: + """DOI component (without hashtag)""" + return str(self._doi) + + def __repr__(self): + return self._doi.__repr__() + + def dates(self, network: str = None) -> dict: + d = {} + if network == "BGC": + for f in self._doi.data["files"]: + if "BGC" in f["fragment"]["title"]: + d.update({int(f["id"]): pd.to_datetime(f["fragment"]["date"])}) + else: + for f in self._doi.data["files"]: + if "BGC" not in f["fragment"]["title"]: + d.update({int(f["id"]): pd.to_datetime(f["fragment"]["date"])}) + return d + + def search(self, date: Union[str, pd.Timestamp], network: str = None) -> DOIrecord: + """Search DOI closest to a given date""" + dates = self.dates(network=network) + target = pd.to_datetime(date, utc=True) + close = list(dates.values())[ + np.argmin(np.abs([target - dates[d] for d in dates])) + ] + found = [d for d in dates if dates[d] == close] + results = [] + if len(found) > 0: + for f in found: + results.append(DOIrecord(hashtag=f, fs=self._fs)) + if len(results) == 1: + if (close - target).days > 30: + warnings.warn( + "This snapshot is more than 30 days off your search dates !" 
+ ) + return results[0] + else: + return results + + @property + def file(self) -> list: + """Return a pretty list of files properties associated with this DOI""" + return self._doi.file + + @property + def dx(self) -> str: + """DOI url""" + return self._doi.dx From 0b8c9d7da899fd4510ca00bfd57a16b50ac67c2f Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Thu, 7 Sep 2023 08:31:19 +0200 Subject: [PATCH 12/33] Refactor MyThreadPoolExecutor as MonitoredThreadPoolExecutor --- argopy/__init__.py | 2 +- argopy/stores/filesystems.py | 2 +- argopy/utils/__init__.py | 4 ++-- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/argopy/__init__.py b/argopy/__init__.py index 1abb83e6..8648d332 100644 --- a/argopy/__init__.py +++ b/argopy/__init__.py @@ -39,7 +39,7 @@ from .options import set_options, reset_options # noqa: E402 from .data_fetchers import CTDRefDataFetcher # noqa: E402 from .stores import ArgoIndex # noqa: E402 -from .utils import monitored_threadpool # noqa: E402, F401 +from .utils import MonitoredThreadPoolExecutor # noqa: E402, F401 from .related import TopoFetcher, OceanOPSDeployments, ArgoNVSReferenceTables, ArgoDocs, ArgoDOI # noqa: E402 diff --git a/argopy/stores/filesystems.py b/argopy/stores/filesystems.py index aede839b..3e08cd3d 100644 --- a/argopy/stores/filesystems.py +++ b/argopy/stores/filesystems.py @@ -54,7 +54,7 @@ drop_variables_not_in_all_datasets, fill_variables_not_in_all_datasets, ) -from ..utils import MyThreadPoolExecutor as MyExecutor +from ..utils import MonitoredThreadPoolExecutor as MyExecutor log = logging.getLogger("argopy.stores") diff --git a/argopy/utils/__init__.py b/argopy/utils/__init__.py index c93ca7db..6408e29e 100644 --- a/argopy/utils/__init__.py +++ b/argopy/utils/__init__.py @@ -1,7 +1,7 @@ -from .monitored_threadpool import MyThreadPoolExecutor +from .monitored_threadpool import MyThreadPoolExecutor as MonitoredThreadPoolExecutor __all__ = ( # Classes: - "MyThreadPoolExecutor", + "MonitoredThreadPoolExecutor", ) From 01669bdcae308460541624a106ac725ad6f80fd0 Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Thu, 7 Sep 2023 08:50:11 +0200 Subject: [PATCH 13/33] refactor most checkers --- argopy/fetchers.py | 4 +- argopy/utilities.py | 380 +-------------------------------------- argopy/utils/__init__.py | 15 +- argopy/utils/checkers.py | 377 ++++++++++++++++++++++++++++++++++++++ 4 files changed, 403 insertions(+), 373 deletions(-) create mode 100644 argopy/utils/checkers.py diff --git a/argopy/fetchers.py b/argopy/fetchers.py index da3143a7..50b142df 100755 --- a/argopy/fetchers.py +++ b/argopy/fetchers.py @@ -21,11 +21,13 @@ from .utilities import ( list_available_data_src, list_available_index_src, + get_coriolis_profile_id, +) +from .utils import ( is_box, is_indexbox, check_wmo, check_cyc, - get_coriolis_profile_id, ) from .plot import plot_trajectory, bar_plot, open_sat_altim_report diff --git a/argopy/utilities.py b/argopy/utilities.py index 831b05fb..396abe0b 100644 --- a/argopy/utilities.py +++ b/argopy/utilities.py @@ -56,6 +56,15 @@ FileSystemHasNoCache, DataNotFound, ) +from .utils import ( + is_box, + is_list_of_strings, + is_wmo, check_wmo, + check_cyc, +) +from .related import ( + ArgoNVSReferenceTables, +) try: collectionsAbc = collections.abc @@ -1363,207 +1372,6 @@ def format_oneline(s, max_width=65): return s -def is_indexbox(box: list, errors="raise"): - """ Check if this array matches a 2d or 3d index box definition - - Argopy expects one of the following 2 format to define an index box: - - - box = [lon_min, 
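Stepping back to the ArgoDOI discovery class created in the doi_snapshot.py patch above, here is a hedged usage sketch based on its docstring; records are fetched from the SEANOE API, so an internet connection is assumed and the dates are illustrative:

    from argopy import ArgoDOI

    doi = ArgoDOI()                                # start from the primary Argo DOI record
    snapshot = doi.search('2020-02')               # DOIrecord closest to February 2020
    bgc = doi.search('2020-02', network='BGC')     # restrict the search to BGC snapshots
    doi.dx                                         # http link toward the DOI
    doi.file                                       # readable list of files attached to the record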
lon_max, lat_min, lat_max] - - box = [lon_min, lon_max, lat_min, lat_max, datim_min, datim_max] - - This function check for this format compliance. - - Parameters - ---------- - box: list - errors: str, default='raise' - - Returns - ------- - bool - """ - def is_dateconvertible(d): - try: - pd.to_datetime(d) - isit = True - except Exception: - isit = False - return isit - - tests = {} - - # Formats: - tests["index box must be a list"] = lambda b: isinstance(b, list) - tests["index box must be a list with 4 or 6 elements"] = lambda b: len(b) in [4, 6] - - # Types: - tests["lon_min must be numeric"] = lambda b: ( - isinstance(b[0], int) or isinstance(b[0], (np.floating, float)) - ) - tests["lon_max must be numeric"] = lambda b: ( - isinstance(b[1], int) or isinstance(b[1], (np.floating, float)) - ) - tests["lat_min must be numeric"] = lambda b: ( - isinstance(b[2], int) or isinstance(b[2], (np.floating, float)) - ) - tests["lat_max must be numeric"] = lambda b: ( - isinstance(b[3], int) or isinstance(b[3], (np.floating, float)) - ) - if len(box) > 4: - tests[ - "datetim_min must be a string convertible to a Pandas datetime" - ] = lambda b: isinstance(b[-2], str) and is_dateconvertible(b[-2]) - tests[ - "datetim_max must be a string convertible to a Pandas datetime" - ] = lambda b: isinstance(b[-1], str) and is_dateconvertible(b[-1]) - - # Ranges: - tests["lon_min must be in [-180;180] or [0;360]"] = ( - lambda b: b[0] >= -180.0 and b[0] <= 360.0 - ) - tests["lon_max must be in [-180;180] or [0;360]"] = ( - lambda b: b[1] >= -180.0 and b[1] <= 360.0 - ) - tests["lat_min must be in [-90;90]"] = lambda b: b[2] >= -90.0 and b[2] <= 90 - tests["lat_max must be in [-90;90]"] = lambda b: b[3] >= -90.0 and b[3] <= 90.0 - - # Orders: - tests["lon_max must be larger than lon_min"] = lambda b: b[0] < b[1] - tests["lat_max must be larger than lat_min"] = lambda b: b[2] < b[3] - if len(box) > 4: - tests["datetim_max must come after datetim_min"] = lambda b: pd.to_datetime( - b[-2] - ) < pd.to_datetime(b[-1]) - - error = None - for msg, test in tests.items(): - if not test(box): - error = msg - break - - if error and errors == "raise": - raise ValueError("%s: %s" % (box, error)) - elif error: - return False - else: - return True - - -def is_box(box: list, errors="raise"): - """Check if this array matches a 3d or 4d data box definition - - Argopy expects one of the following 2 format to define a box: - - - box = [lon_min, lon_max, lat_min, lat_max, pres_min, pres_max] - - box = [lon_min, lon_max, lat_min, lat_max, pres_min, pres_max, datim_min, datim_max] - - This function check for this format compliance. 
- - Parameters - ---------- - box: list - errors: 'raise' - - Returns - ------- - bool - """ - - def is_dateconvertible(d): - try: - pd.to_datetime(d) - isit = True - except Exception: - isit = False - return isit - - tests = {} - # print(box) - # Formats: - tests["box must be a list"] = lambda b: isinstance(b, list) - tests["box must be a list with 6 or 8 elements"] = lambda b: len(b) in [6, 8] - - # Types: - tests["lon_min must be numeric"] = lambda b: ( - isinstance(b[0], int) or isinstance(b[0], (np.floating, float)) - ) - tests["lon_max must be numeric"] = lambda b: ( - isinstance(b[1], int) or isinstance(b[1], (np.floating, float)) - ) - tests["lat_min must be numeric"] = lambda b: ( - isinstance(b[2], int) or isinstance(b[2], (np.floating, float)) - ) - tests["lat_max must be numeric"] = lambda b: ( - isinstance(b[3], int) or isinstance(b[3], (np.floating, float)) - ) - tests["pres_min must be numeric"] = lambda b: ( - isinstance(b[4], int) or isinstance(b[4], (np.floating, float)) - ) - tests["pres_max must be numeric"] = lambda b: ( - isinstance(b[5], int) or isinstance(b[5], (np.floating, float)) - ) - if len(box) == 8: - tests[ - "datetim_min must be an object convertible to a Pandas datetime" - ] = lambda b: is_dateconvertible(b[-2]) - tests[ - "datetim_max must be an object convertible to a Pandas datetime" - ] = lambda b: is_dateconvertible(b[-1]) - - # Ranges: - tests["lon_min must be in [-180;180] or [0;360]"] = ( - lambda b: b[0] >= -180.0 and b[0] <= 360.0 - ) - tests["lon_max must be in [-180;180] or [0;360]"] = ( - lambda b: b[1] >= -180.0 and b[1] <= 360.0 - ) - tests["lat_min must be in [-90;90]"] = lambda b: b[2] >= -90.0 and b[2] <= 90 - tests["lat_max must be in [-90;90]"] = lambda b: b[3] >= -90.0 and b[3] <= 90.0 - tests["pres_min must be in [0;10000]"] = lambda b: b[4] >= 0 and b[4] <= 10000 - tests["pres_max must be in [0;10000]"] = lambda b: b[5] >= 0 and b[5] <= 10000 - - # Orders: - tests["lon_max must be larger than lon_min"] = lambda b: b[0] <= b[1] - tests["lat_max must be larger than lat_min"] = lambda b: b[2] <= b[3] - tests["pres_max must be larger than pres_min"] = lambda b: b[4] <= b[5] - if len(box) == 8: - tests["datetim_max must come after datetim_min"] = lambda b: pd.to_datetime( - b[-2] - ) <= pd.to_datetime(b[-1]) - - error = None - for msg, test in tests.items(): - if not test(box): - error = msg - break - - if error and errors == "raise": - raise ValueError("%s: %s" % (box, error)) - elif error: - return False - else: - return True - - -def is_list_of_strings(lst): - return isinstance(lst, list) and all(isinstance(elem, str) for elem in lst) - - -def is_list_of_dicts(lst): - return all(isinstance(x, dict) for x in lst) - - -def is_list_of_datasets(lst): - return all(isinstance(x, xr.Dataset) for x in lst) - - -def is_list_equal(lst1, lst2): - """ Return true if 2 lists contain same elements""" - return len(lst1) == len(lst2) and len(lst1) == sum( - [1 for i, j in zip(lst1, lst2) if i == j] - ) - - def to_list(obj): """Make sure that an expected list is indeed a list""" if not isinstance(obj, list): @@ -1574,176 +1382,6 @@ def to_list(obj): return obj -def check_wmo(lst, errors="raise"): - """ Validate a WMO option and returned it as a list of integers - - Parameters - ---------- - wmo: int - WMO must be an integer or an iterable with elements that can be casted as integers - errors: {'raise', 'warn', 'ignore'} - Possibly raises a ValueError exception or UserWarning, otherwise fails silently. 
- - Returns - ------- - list(int) - """ - is_wmo(lst, errors=errors) - - # Make sure we deal with a list - lst = to_list(lst) - - # Then cast list elements as integers - return [abs(int(x)) for x in lst] - - -def is_wmo(lst, errors="raise"): # noqa: C901 - """ Check if a WMO is valid - - Parameters - ---------- - wmo: int, list(int), array(int) - WMO must be a single or a list of 5/7 digit positive numbers - errors: {'raise', 'warn', 'ignore'} - Possibly raises a ValueError exception or UserWarning, otherwise fails silently. - - Returns - ------- - bool - True if wmo is indeed a list of integers - """ - - # Make sure we deal with a list - lst = to_list(lst) - - # Error message: - # msg = "WMO must be an integer or an iterable with elements that can be casted as integers" - msg = "WMO must be a single or a list of 5/7 digit positive numbers. Invalid: '{}'".format - - # Then try to cast list elements as integers, return True if ok - result = True - try: - for x in lst: - if not str(x).isdigit(): - result = False - - if (len(str(x)) != 5) and (len(str(x)) != 7): - result = False - - if int(x) <= 0: - result = False - - except Exception: - result = False - if errors == "raise": - raise ValueError(msg(x)) - elif errors == 'warn': - warnings.warn(msg(x)) - - if not result: - if errors == "raise": - raise ValueError(msg(x)) - elif errors == 'warn': - warnings.warn(msg(x)) - else: - return result - - -def check_cyc(lst, errors="raise"): - """ Validate a CYC option and returned it as a list of integers - - Parameters - ---------- - cyc: int - CYC must be an integer or an iterable with elements that can be casted as positive integers - errors: {'raise', 'warn', 'ignore'} - Possibly raises a ValueError exception or UserWarning, otherwise fails silently. - - Returns - ------- - list(int) - """ - is_cyc(lst, errors=errors) - - # Make sure we deal with a list - lst = to_list(lst) - - # Then cast list elements as integers - return [abs(int(x)) for x in lst] - - -def is_cyc(lst, errors="raise"): # noqa: C901 - """ Check if a CYC is valid - Parameters - ---------- - cyc: int, list(int), array(int) - CYC must be a single or a list of at most 4 digit positive numbers - errors: {'raise', 'warn', 'ignore'} - Possibly raises a ValueError exception or UserWarning, otherwise fails silently. - Returns - ------- - bool - True if cyc is indeed a list of integers - """ - # Make sure we deal with a list - lst = to_list(lst) - - # Error message: - msg = "CYC must be a single or a list of at most 4 digit positive numbers. Invalid: '{}'".format - - # Then try to cast list elements as integers, return True if ok - result = True - try: - for x in lst: - if not str(x).isdigit(): - result = False - - if (len(str(x)) > 4): - result = False - - if int(x) < 0: - result = False - - except Exception: - result = False - if errors == "raise": - raise ValueError(msg(x)) - elif errors == 'warn': - warnings.warn(msg(x)) - - if not result: - if errors == "raise": - raise ValueError(msg(x)) - elif errors == 'warn': - warnings.warn(msg(x)) - else: - return result - - -def check_index_cols(column_names: list, convention: str = 'ar_index_global_prof'): - """ - ar_index_global_prof.txt: Index of profile files - Profile directory file of the Argo Global Data Assembly Center - file,date,latitude,longitude,ocean,profiler_type,institution,date_update - - argo_bio-profile_index.txt: bgc Argo profiles index file - The directory file describes all individual bio-profile files of the argo GDAC ftp site. 
- file,date,latitude,longitude,ocean,profiler_type,institution,parameters,parameter_data_mode,date_update - """ - # Default for 'ar_index_global_prof' - ref = ['file', 'date', 'latitude', 'longitude', 'ocean', 'profiler_type', 'institution', - 'date_update'] - if convention == 'argo_bio-profile_index' or convention == 'argo_synthetic-profile_index': - ref = ['file', 'date', 'latitude', 'longitude', 'ocean', 'profiler_type', 'institution', - 'parameters', 'parameter_data_mode', 'date_update'] - - if not is_list_equal(column_names, ref): - # log.debug("Expected: %s, got: %s" % (";".join(ref), ";".join(column_names))) - raise InvalidDatasetStructure("Unexpected column names in this index !") - else: - return column_names - - def warnUnless(ok, txt): """Function to raise a warning unless condition is True diff --git a/argopy/utils/__init__.py b/argopy/utils/__init__.py index 6408e29e..a80c00f1 100644 --- a/argopy/utils/__init__.py +++ b/argopy/utils/__init__.py @@ -1,7 +1,20 @@ from .monitored_threadpool import MyThreadPoolExecutor as MonitoredThreadPoolExecutor - +from .checkers import ( + is_box, is_indexbox, + is_list_of_strings, is_list_of_dicts, is_list_of_datasets, is_list_equal, + is_wmo, check_wmo, + is_cyc, check_cyc, + check_index_cols, +) __all__ = ( # Classes: "MonitoredThreadPoolExecutor", + + # Checkers: + "is_box", "is_indexbox", + "is_list_of_strings", "is_list_of_dicts", "is_list_of_datasets", "is_list_equal", + "is_wmo", "check_wmo", + "is_cyc", "check_cyc", + "check_index_cols", ) diff --git a/argopy/utils/checkers.py b/argopy/utils/checkers.py new file mode 100644 index 00000000..6342c415 --- /dev/null +++ b/argopy/utils/checkers.py @@ -0,0 +1,377 @@ +import warnings +import numpy as np +import pandas as pd +import xarray as xr +from ..utilities import to_list +from ..errors import InvalidDatasetStructure + + +def is_indexbox(box: list, errors="raise"): + """ Check if this array matches a 2d or 3d index box definition + + Argopy expects one of the following 2 format to define an index box: + + - box = [lon_min, lon_max, lat_min, lat_max] + - box = [lon_min, lon_max, lat_min, lat_max, datim_min, datim_max] + + This function check for this format compliance. 
+ + Parameters + ---------- + box: list + errors: str, default='raise' + + Returns + ------- + bool + """ + def is_dateconvertible(d): + try: + pd.to_datetime(d) + isit = True + except Exception: + isit = False + return isit + + tests = {} + + # Formats: + tests["index box must be a list"] = lambda b: isinstance(b, list) + tests["index box must be a list with 4 or 6 elements"] = lambda b: len(b) in [4, 6] + + # Types: + tests["lon_min must be numeric"] = lambda b: ( + isinstance(b[0], int) or isinstance(b[0], (np.floating, float)) + ) + tests["lon_max must be numeric"] = lambda b: ( + isinstance(b[1], int) or isinstance(b[1], (np.floating, float)) + ) + tests["lat_min must be numeric"] = lambda b: ( + isinstance(b[2], int) or isinstance(b[2], (np.floating, float)) + ) + tests["lat_max must be numeric"] = lambda b: ( + isinstance(b[3], int) or isinstance(b[3], (np.floating, float)) + ) + if len(box) > 4: + tests[ + "datetim_min must be a string convertible to a Pandas datetime" + ] = lambda b: isinstance(b[-2], str) and is_dateconvertible(b[-2]) + tests[ + "datetim_max must be a string convertible to a Pandas datetime" + ] = lambda b: isinstance(b[-1], str) and is_dateconvertible(b[-1]) + + # Ranges: + tests["lon_min must be in [-180;180] or [0;360]"] = ( + lambda b: b[0] >= -180.0 and b[0] <= 360.0 + ) + tests["lon_max must be in [-180;180] or [0;360]"] = ( + lambda b: b[1] >= -180.0 and b[1] <= 360.0 + ) + tests["lat_min must be in [-90;90]"] = lambda b: b[2] >= -90.0 and b[2] <= 90 + tests["lat_max must be in [-90;90]"] = lambda b: b[3] >= -90.0 and b[3] <= 90.0 + + # Orders: + tests["lon_max must be larger than lon_min"] = lambda b: b[0] < b[1] + tests["lat_max must be larger than lat_min"] = lambda b: b[2] < b[3] + if len(box) > 4: + tests["datetim_max must come after datetim_min"] = lambda b: pd.to_datetime( + b[-2] + ) < pd.to_datetime(b[-1]) + + error = None + for msg, test in tests.items(): + if not test(box): + error = msg + break + + if error and errors == "raise": + raise ValueError("%s: %s" % (box, error)) + elif error: + return False + else: + return True + + +def is_box(box: list, errors="raise"): + """Check if this array matches a 3d or 4d data box definition + + Argopy expects one of the following 2 format to define a box: + + - box = [lon_min, lon_max, lat_min, lat_max, pres_min, pres_max] + - box = [lon_min, lon_max, lat_min, lat_max, pres_min, pres_max, datim_min, datim_max] + + This function check for this format compliance. 
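To make the expected box formats concrete, a small sketch using the checkers now hosted in argopy/utils/checkers.py; the values are illustrative and mirror the tests added further down in this series:

    from argopy.utils import is_box, is_indexbox

    is_box([0, 20, 40, 60, 0, 1000])                         # 3d data box -> True
    is_box([0, 20, 40, 60, 0, 1000, "2001-01", "2001-06"])   # 4d data box -> True
    is_indexbox([0, 20, 40, 60])                             # 2d index box -> True
    is_box([0, 20, 40, 60], errors="ignore")                 # wrong length: returns False instead of raising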
+ + Parameters + ---------- + box: list + errors: 'raise' + + Returns + ------- + bool + """ + + def is_dateconvertible(d): + try: + pd.to_datetime(d) + isit = True + except Exception: + isit = False + return isit + + tests = {} + # print(box) + # Formats: + tests["box must be a list"] = lambda b: isinstance(b, list) + tests["box must be a list with 6 or 8 elements"] = lambda b: len(b) in [6, 8] + + # Types: + tests["lon_min must be numeric"] = lambda b: ( + isinstance(b[0], int) or isinstance(b[0], (np.floating, float)) + ) + tests["lon_max must be numeric"] = lambda b: ( + isinstance(b[1], int) or isinstance(b[1], (np.floating, float)) + ) + tests["lat_min must be numeric"] = lambda b: ( + isinstance(b[2], int) or isinstance(b[2], (np.floating, float)) + ) + tests["lat_max must be numeric"] = lambda b: ( + isinstance(b[3], int) or isinstance(b[3], (np.floating, float)) + ) + tests["pres_min must be numeric"] = lambda b: ( + isinstance(b[4], int) or isinstance(b[4], (np.floating, float)) + ) + tests["pres_max must be numeric"] = lambda b: ( + isinstance(b[5], int) or isinstance(b[5], (np.floating, float)) + ) + if len(box) == 8: + tests[ + "datetim_min must be an object convertible to a Pandas datetime" + ] = lambda b: is_dateconvertible(b[-2]) + tests[ + "datetim_max must be an object convertible to a Pandas datetime" + ] = lambda b: is_dateconvertible(b[-1]) + + # Ranges: + tests["lon_min must be in [-180;180] or [0;360]"] = ( + lambda b: b[0] >= -180.0 and b[0] <= 360.0 + ) + tests["lon_max must be in [-180;180] or [0;360]"] = ( + lambda b: b[1] >= -180.0 and b[1] <= 360.0 + ) + tests["lat_min must be in [-90;90]"] = lambda b: b[2] >= -90.0 and b[2] <= 90 + tests["lat_max must be in [-90;90]"] = lambda b: b[3] >= -90.0 and b[3] <= 90.0 + tests["pres_min must be in [0;10000]"] = lambda b: b[4] >= 0 and b[4] <= 10000 + tests["pres_max must be in [0;10000]"] = lambda b: b[5] >= 0 and b[5] <= 10000 + + # Orders: + tests["lon_max must be larger than lon_min"] = lambda b: b[0] <= b[1] + tests["lat_max must be larger than lat_min"] = lambda b: b[2] <= b[3] + tests["pres_max must be larger than pres_min"] = lambda b: b[4] <= b[5] + if len(box) == 8: + tests["datetim_max must come after datetim_min"] = lambda b: pd.to_datetime( + b[-2] + ) <= pd.to_datetime(b[-1]) + + error = None + for msg, test in tests.items(): + if not test(box): + error = msg + break + + if error and errors == "raise": + raise ValueError("%s: %s" % (box, error)) + elif error: + return False + else: + return True + + +def is_list_of_strings(lst): + return isinstance(lst, list) and all(isinstance(elem, str) for elem in lst) + + +def is_list_of_dicts(lst): + return all(isinstance(x, dict) for x in lst) + + +def is_list_of_datasets(lst): + return all(isinstance(x, xr.Dataset) for x in lst) + + +def is_list_equal(lst1, lst2): + """ Return true if 2 lists contain same elements""" + return len(lst1) == len(lst2) and len(lst1) == sum( + [1 for i, j in zip(lst1, lst2) if i == j] + ) + + +def check_wmo(lst, errors="raise"): + """ Validate a WMO option and returned it as a list of integers + + Parameters + ---------- + wmo: int + WMO must be an integer or an iterable with elements that can be casted as integers + errors: {'raise', 'warn', 'ignore'} + Possibly raises a ValueError exception or UserWarning, otherwise fails silently. 
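The small list predicates moved alongside the checkers are pure Python helpers with no I/O; a quick sketch:

    from argopy.utils import is_list_of_strings, is_list_equal

    is_list_of_strings(["TEMP", "PSAL"])   # True
    is_list_of_strings(["TEMP", 7])        # False
    is_list_equal([1, 2, 3], [1, 2, 3])    # True
    is_list_equal([1, 2, 3], [3, 2, 1])    # False: same elements but not in the same order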
+ + Returns + ------- + list(int) + """ + is_wmo(lst, errors=errors) + + # Make sure we deal with a list + lst = to_list(lst) + + # Then cast list elements as integers + return [abs(int(x)) for x in lst] + + +def is_wmo(lst, errors="raise"): # noqa: C901 + """ Check if a WMO is valid + + Parameters + ---------- + wmo: int, list(int), array(int) + WMO must be a single or a list of 5/7 digit positive numbers + errors: {'raise', 'warn', 'ignore'} + Possibly raises a ValueError exception or UserWarning, otherwise fails silently. + + Returns + ------- + bool + True if wmo is indeed a list of integers + """ + + # Make sure we deal with a list + lst = to_list(lst) + + # Error message: + # msg = "WMO must be an integer or an iterable with elements that can be casted as integers" + msg = "WMO must be a single or a list of 5/7 digit positive numbers. Invalid: '{}'".format + + # Then try to cast list elements as integers, return True if ok + result = True + try: + for x in lst: + if not str(x).isdigit(): + result = False + + if (len(str(x)) != 5) and (len(str(x)) != 7): + result = False + + if int(x) <= 0: + result = False + + except Exception: + result = False + if errors == "raise": + raise ValueError(msg(x)) + elif errors == 'warn': + warnings.warn(msg(x)) + + if not result: + if errors == "raise": + raise ValueError(msg(x)) + elif errors == 'warn': + warnings.warn(msg(x)) + else: + return result + + +def check_cyc(lst, errors="raise"): + """ Validate a CYC option and returned it as a list of integers + + Parameters + ---------- + cyc: int + CYC must be an integer or an iterable with elements that can be casted as positive integers + errors: {'raise', 'warn', 'ignore'} + Possibly raises a ValueError exception or UserWarning, otherwise fails silently. + + Returns + ------- + list(int) + """ + is_cyc(lst, errors=errors) + + # Make sure we deal with a list + lst = to_list(lst) + + # Then cast list elements as integers + return [abs(int(x)) for x in lst] + + +def is_cyc(lst, errors="raise"): # noqa: C901 + """ Check if a CYC is valid + Parameters + ---------- + cyc: int, list(int), array(int) + CYC must be a single or a list of at most 4 digit positive numbers + errors: {'raise', 'warn', 'ignore'} + Possibly raises a ValueError exception or UserWarning, otherwise fails silently. + Returns + ------- + bool + True if cyc is indeed a list of integers + """ + # Make sure we deal with a list + lst = to_list(lst) + + # Error message: + msg = "CYC must be a single or a list of at most 4 digit positive numbers. Invalid: '{}'".format + + # Then try to cast list elements as integers, return True if ok + result = True + try: + for x in lst: + if not str(x).isdigit(): + result = False + + if (len(str(x)) > 4): + result = False + + if int(x) < 0: + result = False + + except Exception: + result = False + if errors == "raise": + raise ValueError(msg(x)) + elif errors == 'warn': + warnings.warn(msg(x)) + + if not result: + if errors == "raise": + raise ValueError(msg(x)) + elif errors == 'warn': + warnings.warn(msg(x)) + else: + return result + + +def check_index_cols(column_names: list, convention: str = 'ar_index_global_prof'): + """ + ar_index_global_prof.txt: Index of profile files + Profile directory file of the Argo Global Data Assembly Center + file,date,latitude,longitude,ocean,profiler_type,institution,date_update + + argo_bio-profile_index.txt: bgc Argo profiles index file + The directory file describes all individual bio-profile files of the argo GDAC ftp site. 
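A minimal sketch of the WMO and cycle number checkers, mirroring the behaviour exercised in argopy/tests/test_utils_checkers.py added later in this series:

    from argopy.utils import is_wmo, check_wmo, is_cyc, check_cyc

    is_wmo([12345, 1234567])        # True: 5 and 7 digit positive numbers
    is_wmo(1234, errors="ignore")   # falsy result (invalid WMO), nothing raised
    check_wmo(12345)                # [12345], always returned as a list of int
    check_cyc([12, 123])            # [12, 123]
    is_cyc(12345, errors="ignore")  # falsy: cycle numbers have at most 4 digits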
+ file,date,latitude,longitude,ocean,profiler_type,institution,parameters,parameter_data_mode,date_update + """ + # Default for 'ar_index_global_prof' + ref = ['file', 'date', 'latitude', 'longitude', 'ocean', 'profiler_type', 'institution', + 'date_update'] + if convention == 'argo_bio-profile_index' or convention == 'argo_synthetic-profile_index': + ref = ['file', 'date', 'latitude', 'longitude', 'ocean', 'profiler_type', 'institution', + 'parameters', 'parameter_data_mode', 'date_update'] + + if not is_list_equal(column_names, ref): + # log.debug("Expected: %s, got: %s" % (";".join(ref), ";".join(column_names))) + raise InvalidDatasetStructure("Unexpected column names in this index !") + else: + return column_names From a5da1766b9483918f63c81c4430c0df4c899f32e Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Fri, 8 Sep 2023 09:50:47 +0200 Subject: [PATCH 14/33] [skip-ci] --- argopy/data_fetchers/erddap_data.py | 20 +- argopy/plot/dashboards.py | 3 +- argopy/plot/plot.py | 3 +- argopy/related/__init__.py | 5 + argopy/related/euroargo_api.py | 101 ++ argopy/stores/argo_index_pa.py | 2 +- argopy/stores/argo_index_pd.py | 2 +- argopy/tests/test_fetchers_data_argovis.py | 2 +- argopy/tests/test_fetchers_data_erddap.py | 2 +- argopy/tests/test_fetchers_data_erddap_bgc.py | 2 +- argopy/tests/test_fetchers_data_gdac.py | 3 +- argopy/tests/test_fetchers_facade_data.py | 2 +- argopy/tests/test_fetchers_index_gdac.py | 3 +- argopy/tests/test_fetchers_proto.py | 2 +- argopy/tests/test_stores_fsspec.py | 4 +- argopy/tests/test_stores_index.py | 2 +- argopy/tests/test_utilities.py | 180 +--- argopy/tests/test_utils_checkers.py | 179 ++++ argopy/utilities.py | 900 +----------------- argopy/utils/__init__.py | 27 + argopy/utils/casting.py | 376 ++++++++ argopy/utils/checkers.py | 97 +- argopy/utils/decorators.py | 154 +++ argopy/utils/lists.py | 198 ++++ argopy/xarray.py | 12 +- 25 files changed, 1178 insertions(+), 1103 deletions(-) create mode 100644 argopy/related/euroargo_api.py create mode 100644 argopy/tests/test_utils_checkers.py create mode 100644 argopy/utils/casting.py create mode 100644 argopy/utils/decorators.py create mode 100644 argopy/utils/lists.py diff --git a/argopy/data_fetchers/erddap_data.py b/argopy/data_fetchers/erddap_data.py index 9ac5d3b4..c3d3ea58 100644 --- a/argopy/data_fetchers/erddap_data.py +++ b/argopy/data_fetchers/erddap_data.py @@ -21,18 +21,16 @@ import getpass from typing import Union import fnmatch +from aiohttp import ClientResponseError +import logging from .proto import ArgoDataFetcherProto -from argopy.options import OPTIONS -from argopy.utilities import Chunker, format_oneline, to_list -from argopy.stores import httpstore +from ..options import OPTIONS +from ..utilities import Chunker, format_oneline +from ..stores import httpstore from ..errors import ErddapServerError, DataNotFound -from ..stores import ( - indexstore_pd as ArgoIndex, -) # make sure to work with the Pandas index store - -from aiohttp import ClientResponseError -import logging +from ..stores import indexstore_pd as ArgoIndex # make sure we work with the Pandas index store +from ..utils import is_list_of_strings, to_list # Load erddapy according to available version (breaking changes in v0.8.0) try: @@ -201,7 +199,7 @@ def __init__( # noqa: C901 raise ValueError() elif params[0] == "all": params = self._bgc_vlist_avail - elif not argopy.utilities.is_list_of_strings(params): + elif not is_list_of_strings(params): raise ValueError("'params' argument must be a list of strings") # raise 
ValueError("'params' argument must be a list of strings (possibly with a * wildcard)") self._bgc_vlist_requested = [p.upper() for p in params] @@ -222,7 +220,7 @@ def __init__( # noqa: C901 measured = [] elif self._bgc_measured[0] == "all": measured = self._bgc_vlist_requested - elif not argopy.utilities.is_list_of_strings(self._bgc_measured): + elif not is_list_of_strings(self._bgc_measured): raise ValueError("'measured' argument must be a list of strings") # raise ValueError("'measured' argument must be a list of strings (possibly with a * wildcard)") self._bgc_vlist_measured = [m.upper() for m in measured] diff --git a/argopy/plot/dashboards.py b/argopy/plot/dashboards.py index 6b513e1f..5f95d0f2 100644 --- a/argopy/plot/dashboards.py +++ b/argopy/plot/dashboards.py @@ -11,7 +11,8 @@ from packaging import version from .utils import has_ipython -from ..utilities import warnUnless, check_wmo, check_cyc, get_ea_profile_page +from ..utilities import warnUnless, get_ea_profile_page +from ..utils import check_wmo, check_cyc from ..errors import InvalidDashboard from .. import __version__ as argopy_version diff --git a/argopy/plot/plot.py b/argopy/plot/plot.py index d9e52c12..22248777 100644 --- a/argopy/plot/plot.py +++ b/argopy/plot/plot.py @@ -18,7 +18,8 @@ from .utils import axes_style, latlongrid, land_feature from .argo_colors import ArgoColors -from ..utilities import warnUnless, check_wmo +from ..utilities import warnUnless +from ..utils import check_wmo from ..errors import InvalidDatasetStructure if has_mpl: diff --git a/argopy/related/__init__.py b/argopy/related/__init__.py index 84c62f22..5c960c9d 100644 --- a/argopy/related/__init__.py +++ b/argopy/related/__init__.py @@ -3,6 +3,7 @@ from .reference_tables import ArgoNVSReferenceTables from .argo_documentation import ArgoDocs from .doi_snapshot import ArgoDOI +from .euroargo_api import get_coriolis_profile_id, get_ea_profile_page # @@ -13,4 +14,8 @@ "ArgoNVSReferenceTables", "ArgoDocs", "ArgoDOI", + + # Functions: + "get_coriolis_profile_id", + "get_ea_profile_page", ) diff --git a/argopy/related/euroargo_api.py b/argopy/related/euroargo_api.py new file mode 100644 index 00000000..b9e9b8b6 --- /dev/null +++ b/argopy/related/euroargo_api.py @@ -0,0 +1,101 @@ +import pandas as pd +from ..options import OPTIONS +from ..utils import check_wmo, check_cyc +from ..stores import httpstore + + +def get_coriolis_profile_id(WMO, CYC=None, **kwargs): + """ Return a :class:`pandas.DataFrame` with CORIOLIS ID of WMO/CYC profile pairs + + This method get ID by requesting the dataselection.euro-argo.eu trajectory API. + + Parameters + ---------- + WMO: int, list(int) + Define the list of Argo floats. This is a list of integers with WMO float identifiers. + WMO is the World Meteorological Organization. + CYC: int, list(int) + Define the list of cycle numbers to load ID for each Argo floats listed in ``WMO``. 
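A usage sketch for the two Euro-Argo API helpers added in argopy/related/euroargo_api.py; the WMO/cycle pair below is purely illustrative, and both calls assume access to the dataselection.euro-argo.eu API:

    from argopy.related import get_coriolis_profile_id, get_ea_profile_page

    df = get_coriolis_profile_id(6902746, 34)   # DataFrame with PLATFORM_NUMBER, CYCLE_NUMBER, ID, LATITUDE, LONGITUDE, level
    urls = get_ea_profile_page(6902746, 34)     # list of https://dataselection.euro-argo.eu/cycle/<ID> pages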
+ + Returns + ------- + :class:`pandas.DataFrame` + """ + WMO_list = check_wmo(WMO) + if CYC is not None: + CYC_list = check_cyc(CYC) + if 'api_server' in kwargs: + api_server = kwargs['api_server'] + elif OPTIONS['server'] is not None: + api_server = OPTIONS['server'] + else: + api_server = "https://dataselection.euro-argo.eu/api" + URIs = [api_server + "/trajectory/%i" % wmo for wmo in WMO_list] + + def prec(data, url): + # Transform trajectory json to dataframe + # See: https://dataselection.euro-argo.eu/swagger-ui.html#!/cycle-controller/getCyclesByPlatformCodeUsingGET + WMO = check_wmo(url.split("/")[-1])[0] + rows = [] + for profile in data: + keys = [x for x in profile.keys() if x not in ["coordinate"]] + meta_row = dict((key, profile[key]) for key in keys) + for row in profile["coordinate"]: + meta_row[row] = profile["coordinate"][row] + meta_row["WMO"] = WMO + rows.append(meta_row) + return pd.DataFrame(rows) + + fs = httpstore(cache=True, cachedir=OPTIONS['cachedir']) + data = fs.open_mfjson(URIs, preprocess=prec, errors="raise", url_follow=True) + + # Merge results (list of dataframe): + key_map = { + "id": "ID", + "lat": "LATITUDE", + "lon": "LONGITUDE", + "cvNumber": "CYCLE_NUMBER", + "level": "level", + "WMO": "PLATFORM_NUMBER", + } + for i, df in enumerate(data): + df = df.reset_index() + df = df.rename(columns=key_map) + df = df[[value for value in key_map.values() if value in df.columns]] + data[i] = df + df = pd.concat(data, ignore_index=True) + df.sort_values(by=["PLATFORM_NUMBER", "CYCLE_NUMBER"], inplace=True) + df = df.reset_index(drop=True) + # df = df.set_index(["PLATFORM_NUMBER", "CYCLE_NUMBER"]) + df = df.astype({"ID": int}) + if CYC is not None: + df = pd.concat([df[df["CYCLE_NUMBER"] == cyc] for cyc in CYC_list]).reset_index( + drop=True + ) + return df[ + ["PLATFORM_NUMBER", "CYCLE_NUMBER", "ID", "LATITUDE", "LONGITUDE", "level"] + ] + + +def get_ea_profile_page(WMO, CYC=None, **kwargs): + """ Return a list of URL + + Parameters + ---------- + WMO: int, list(int) + WMO must be an integer or an iterable with elements that can be casted as integers + CYC: int, list(int), default (None) + CYC must be an integer or an iterable with elements that can be casted as positive integers + + Returns + ------- + list(str) + + See also + -------- + get_coriolis_profile_id + """ + df = get_coriolis_profile_id(WMO, CYC, **kwargs) + url = "https://dataselection.euro-argo.eu/cycle/{}" + return [url.format(this_id) for this_id in sorted(df["ID"])] + diff --git a/argopy/stores/argo_index_pa.py b/argopy/stores/argo_index_pa.py index 83d10ea4..df17b348 100644 --- a/argopy/stores/argo_index_pa.py +++ b/argopy/stores/argo_index_pa.py @@ -12,7 +12,7 @@ from packaging import version from ..errors import DataNotFound, InvalidDatasetStructure -from ..utilities import check_index_cols, is_indexbox, check_wmo, check_cyc, to_list +from ..utils import check_index_cols, is_indexbox, check_wmo, check_cyc, to_list from .argo_index_proto import ArgoIndexStoreProto try: import pyarrow.csv as csv # noqa: F401 diff --git a/argopy/stores/argo_index_pd.py b/argopy/stores/argo_index_pd.py index 5e69daed..7c00fca2 100644 --- a/argopy/stores/argo_index_pd.py +++ b/argopy/stores/argo_index_pd.py @@ -10,7 +10,7 @@ import gzip from ..errors import DataNotFound, InvalidDatasetStructure -from ..utilities import check_index_cols, is_indexbox, check_wmo, check_cyc, to_list +from ..utils import check_index_cols, is_indexbox, check_wmo, check_cyc, to_list from .argo_index_proto import ArgoIndexStoreProto diff 
--git a/argopy/tests/test_fetchers_data_argovis.py b/argopy/tests/test_fetchers_data_argovis.py index 6a083837..1db64d2b 100644 --- a/argopy/tests/test_fetchers_data_argovis.py +++ b/argopy/tests/test_fetchers_data_argovis.py @@ -13,7 +13,7 @@ CacheFileNotFound, FileSystemHasNoCache, ) -from argopy.utilities import is_list_of_strings +from argopy.utils import is_list_of_strings from utils import requires_connected_argovis, safe_to_server_errors diff --git a/argopy/tests/test_fetchers_data_erddap.py b/argopy/tests/test_fetchers_data_erddap.py index a0f299e6..eecf96a2 100644 --- a/argopy/tests/test_fetchers_data_erddap.py +++ b/argopy/tests/test_fetchers_data_erddap.py @@ -1,7 +1,7 @@ import logging from argopy import DataFetcher as ArgoDataFetcher -from argopy.utilities import is_list_of_strings +from argopy.utils import is_list_of_strings import pytest import xarray as xr diff --git a/argopy/tests/test_fetchers_data_erddap_bgc.py b/argopy/tests/test_fetchers_data_erddap_bgc.py index c01f230e..d3696e0a 100644 --- a/argopy/tests/test_fetchers_data_erddap_bgc.py +++ b/argopy/tests/test_fetchers_data_erddap_bgc.py @@ -2,7 +2,7 @@ import numpy as np from argopy import DataFetcher as ArgoDataFetcher -from argopy.utilities import is_list_of_strings +from argopy.utils import is_list_of_strings from argopy.stores import indexstore_pd as ArgoIndex # make sure to work with the Pandas index store with erddap-bgc import pytest diff --git a/argopy/tests/test_fetchers_data_gdac.py b/argopy/tests/test_fetchers_data_gdac.py index 4fd6c184..94faa7af 100644 --- a/argopy/tests/test_fetchers_data_gdac.py +++ b/argopy/tests/test_fetchers_data_gdac.py @@ -19,7 +19,8 @@ FileSystemHasNoCache, FtpPathError, ) -from argopy.utilities import is_list_of_strings, isconnected +from argopy.utilities import isconnected +from argopy.utils import is_list_of_strings from utils import requires_gdac from mocked_http import mocked_httpserver, mocked_server_address from collections import ChainMap diff --git a/argopy/tests/test_fetchers_facade_data.py b/argopy/tests/test_fetchers_facade_data.py index 944a1611..17e0646c 100644 --- a/argopy/tests/test_fetchers_facade_data.py +++ b/argopy/tests/test_fetchers_facade_data.py @@ -10,7 +10,7 @@ InvalidFetcher, OptionValueError, ) -from argopy.utilities import is_list_of_strings +from argopy.utils import is_list_of_strings from utils import ( requires_fetcher, requires_connection, diff --git a/argopy/tests/test_fetchers_index_gdac.py b/argopy/tests/test_fetchers_index_gdac.py index efd73afc..d5f23200 100644 --- a/argopy/tests/test_fetchers_index_gdac.py +++ b/argopy/tests/test_fetchers_index_gdac.py @@ -13,7 +13,8 @@ FileSystemHasNoCache, FtpPathError ) -from argopy.utilities import is_list_of_strings, isconnected +from argopy.utilities import isconnected +from argopy.utils import is_list_of_strings from utils import requires_gdac from mocked_http import mocked_httpserver, mocked_server_address diff --git a/argopy/tests/test_fetchers_proto.py b/argopy/tests/test_fetchers_proto.py index 0912cad7..24f669ff 100644 --- a/argopy/tests/test_fetchers_proto.py +++ b/argopy/tests/test_fetchers_proto.py @@ -1,7 +1,7 @@ import pytest import xarray from argopy.data_fetchers.proto import ArgoDataFetcherProto -from argopy.utilities import to_list +from argopy.utils import to_list class Fetcher(ArgoDataFetcherProto): diff --git a/argopy/tests/test_stores_fsspec.py b/argopy/tests/test_stores_fsspec.py index 1ad338ae..b2766d5b 100644 --- a/argopy/tests/test_stores_fsspec.py +++ 
b/argopy/tests/test_stores_fsspec.py @@ -30,9 +30,11 @@ DataNotFound, ) from argopy.utilities import ( + modified_environ, +) +from argopy.utils import ( is_list_of_datasets, is_list_of_dicts, - modified_environ, ) from utils import requires_connection, requires_connected_argovis from mocked_http import mocked_httpserver, mocked_server_address diff --git a/argopy/tests/test_stores_index.py b/argopy/tests/test_stores_index.py index 49b791ad..36823bf0 100644 --- a/argopy/tests/test_stores_index.py +++ b/argopy/tests/test_stores_index.py @@ -16,7 +16,7 @@ OptionValueError, InvalidDatasetStructure, ) -from argopy.utilities import ( +from argopy.utils import ( is_list_of_strings, ) from argopy.stores.argo_index_pd import indexstore_pandas diff --git a/argopy/tests/test_utilities.py b/argopy/tests/test_utilities.py index 24d37cb5..4f691037 100644 --- a/argopy/tests/test_utilities.py +++ b/argopy/tests/test_utilities.py @@ -20,11 +20,7 @@ erddap_ds_exists, linear_interpolation_remap, Chunker, - is_box, - is_list_of_strings, - format_oneline, is_indexbox, - check_wmo, is_wmo, - check_cyc, is_cyc, + format_oneline, wmo2box, modified_environ, wrap_longitude, @@ -35,6 +31,10 @@ get_coriolis_profile_id, get_ea_profile_page, ) +from argopy.utils import ( + is_box, + is_list_of_strings, +) from argopy.errors import InvalidFetcherAccessPoint, FtpPathError from argopy import DataFetcher as ArgoDataFetcher from utils import ( @@ -394,104 +394,6 @@ def test_chunk_box4d(self): ) -class Test_is_box: - @pytest.fixture(autouse=True) - def create_data(self): - self.BOX3d = [0, 20, 40, 60, 0, 1000] - self.BOX4d = [0, 20, 40, 60, 0, 1000, "2001-01", "2001-6"] - - def test_box_ok(self): - assert is_box(self.BOX3d) - assert is_box(self.BOX4d) - - def test_box_notok(self): - for box in [[], list(range(0, 12))]: - with pytest.raises(ValueError): - is_box(box) - with pytest.raises(ValueError): - is_box(box, errors="raise") - assert not is_box(box, errors="ignore") - - def test_box_invalid_num(self): - for i in [0, 1, 2, 3, 4, 5]: - box = self.BOX3d - box[i] = "str" - with pytest.raises(ValueError): - is_box(box) - with pytest.raises(ValueError): - is_box(box, errors="raise") - assert not is_box(box, errors="ignore") - - def test_box_invalid_range(self): - for i in [0, 1, 2, 3, 4, 5]: - box = self.BOX3d - box[i] = -1000 - with pytest.raises(ValueError): - is_box(box) - with pytest.raises(ValueError): - is_box(box, errors="raise") - assert not is_box(box, errors="ignore") - - def test_box_invalid_str(self): - for i in [6, 7]: - box = self.BOX4d - box[i] = "str" - with pytest.raises(ValueError): - is_box(box) - with pytest.raises(ValueError): - is_box(box, errors="raise") - assert not is_box(box, errors="ignore") - - -class Test_is_indexbox: - @pytest.fixture(autouse=True) - def create_data(self): - self.BOX2d = [0, 20, 40, 60] - self.BOX3d = [0, 20, 40, 60, "2001-01", "2001-6"] - - def test_box_ok(self): - assert is_indexbox(self.BOX2d) - assert is_indexbox(self.BOX3d) - - def test_box_notok(self): - for box in [[], list(range(0, 12))]: - with pytest.raises(ValueError): - is_indexbox(box) - with pytest.raises(ValueError): - is_indexbox(box, errors="raise") - assert not is_indexbox(box, errors="ignore") - - def test_box_invalid_num(self): - for i in [0, 1, 2, 3]: - box = self.BOX2d - box[i] = "str" - with pytest.raises(ValueError): - is_indexbox(box) - with pytest.raises(ValueError): - is_indexbox(box, errors="raise") - assert not is_indexbox(box, errors="ignore") - - def test_box_invalid_range(self): - for i in [0, 1, 2, 
3]: - box = self.BOX2d - box[i] = -1000 - with pytest.raises(ValueError): - is_indexbox(box) - with pytest.raises(ValueError): - is_indexbox(box, errors="raise") - assert not is_indexbox(box, errors="ignore") - - def test_box_invalid_str(self): - for i in [4, 5]: - box = self.BOX3d - box[i] = "str" - with pytest.raises(ValueError): - is_indexbox(box) - with pytest.raises(ValueError): - is_indexbox(box, errors="raise") - assert not is_indexbox(box, errors="ignore") - - def test_format_oneline(): s = "Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore" assert isinstance(format_oneline(s), str) @@ -500,78 +402,6 @@ def test_format_oneline(): assert isinstance(s, str) and len(s) == 12 -def test_is_wmo(): - assert is_wmo(12345) - assert is_wmo([12345]) - assert is_wmo([12345, 1234567]) - - with pytest.raises(ValueError): - is_wmo(1234, errors="raise") - with pytest.raises(ValueError): - is_wmo(-1234, errors="raise") - with pytest.raises(ValueError): - is_wmo(1234.12, errors="raise") - with pytest.raises(ValueError): - is_wmo(12345.7, errors="raise") - - with pytest.warns(UserWarning): - is_wmo(1234, errors="warn") - with pytest.warns(UserWarning): - is_wmo(-1234, errors="warn") - with pytest.warns(UserWarning): - is_wmo(1234.12, errors="warn") - with pytest.warns(UserWarning): - is_wmo(12345.7, errors="warn") - - assert not is_wmo(12, errors="ignore") - assert not is_wmo(-12, errors="ignore") - assert not is_wmo(1234.12, errors="ignore") - assert not is_wmo(12345.7, errors="ignore") - - -def test_check_wmo(): - assert check_wmo(12345) == [12345] - assert check_wmo([1234567]) == [1234567] - assert check_wmo([12345, 1234567]) == [12345, 1234567] - assert check_wmo(np.array((12345, 1234567), dtype='int')) == [12345, 1234567] - - -def test_is_cyc(): - assert is_cyc(123) - assert is_cyc([123]) - assert is_cyc([12, 123, 1234]) - - with pytest.raises(ValueError): - is_cyc(12345, errors="raise") - with pytest.raises(ValueError): - is_cyc(-1234, errors="raise") - with pytest.raises(ValueError): - is_cyc(1234.12, errors="raise") - with pytest.raises(ValueError): - is_cyc(12345.7, errors="raise") - - with pytest.warns(UserWarning): - is_cyc(12345, errors="warn") - with pytest.warns(UserWarning): - is_cyc(-1234, errors="warn") - with pytest.warns(UserWarning): - is_cyc(1234.12, errors="warn") - with pytest.warns(UserWarning): - is_cyc(12345.7, errors="warn") - - assert not is_cyc(12345, errors="ignore") - assert not is_cyc(-12, errors="ignore") - assert not is_cyc(1234.12, errors="ignore") - assert not is_cyc(12345.7, errors="ignore") - - -def test_check_cyc(): - assert check_cyc(123) == [123] - assert check_cyc([12]) == [12] - assert check_cyc([12, 123]) == [12, 123] - assert check_cyc(np.array((123, 1234), dtype='int')) == [123, 1234] - - def test_modified_environ(): os.environ["DUMMY_ENV_ARGOPY"] = 'initial' with modified_environ(DUMMY_ENV_ARGOPY='toto'): diff --git a/argopy/tests/test_utils_checkers.py b/argopy/tests/test_utils_checkers.py new file mode 100644 index 00000000..5ccc14af --- /dev/null +++ b/argopy/tests/test_utils_checkers.py @@ -0,0 +1,179 @@ +import pytest +import numpy as np + +from argopy.utils import ( + is_box, is_indexbox, + check_wmo, is_wmo, + check_cyc, is_cyc, +) + + +class Test_is_box: + @pytest.fixture(autouse=True) + def create_data(self): + self.BOX3d = [0, 20, 40, 60, 0, 1000] + self.BOX4d = [0, 20, 40, 60, 0, 1000, "2001-01", "2001-6"] + + def test_box_ok(self): + assert is_box(self.BOX3d) + assert 
is_box(self.BOX4d) + + def test_box_notok(self): + for box in [[], list(range(0, 12))]: + with pytest.raises(ValueError): + is_box(box) + with pytest.raises(ValueError): + is_box(box, errors="raise") + assert not is_box(box, errors="ignore") + + def test_box_invalid_num(self): + for i in [0, 1, 2, 3, 4, 5]: + box = self.BOX3d + box[i] = "str" + with pytest.raises(ValueError): + is_box(box) + with pytest.raises(ValueError): + is_box(box, errors="raise") + assert not is_box(box, errors="ignore") + + def test_box_invalid_range(self): + for i in [0, 1, 2, 3, 4, 5]: + box = self.BOX3d + box[i] = -1000 + with pytest.raises(ValueError): + is_box(box) + with pytest.raises(ValueError): + is_box(box, errors="raise") + assert not is_box(box, errors="ignore") + + def test_box_invalid_str(self): + for i in [6, 7]: + box = self.BOX4d + box[i] = "str" + with pytest.raises(ValueError): + is_box(box) + with pytest.raises(ValueError): + is_box(box, errors="raise") + assert not is_box(box, errors="ignore") + + +class Test_is_indexbox: + @pytest.fixture(autouse=True) + def create_data(self): + self.BOX2d = [0, 20, 40, 60] + self.BOX3d = [0, 20, 40, 60, "2001-01", "2001-6"] + + def test_box_ok(self): + assert is_indexbox(self.BOX2d) + assert is_indexbox(self.BOX3d) + + def test_box_notok(self): + for box in [[], list(range(0, 12))]: + with pytest.raises(ValueError): + is_indexbox(box) + with pytest.raises(ValueError): + is_indexbox(box, errors="raise") + assert not is_indexbox(box, errors="ignore") + + def test_box_invalid_num(self): + for i in [0, 1, 2, 3]: + box = self.BOX2d + box[i] = "str" + with pytest.raises(ValueError): + is_indexbox(box) + with pytest.raises(ValueError): + is_indexbox(box, errors="raise") + assert not is_indexbox(box, errors="ignore") + + def test_box_invalid_range(self): + for i in [0, 1, 2, 3]: + box = self.BOX2d + box[i] = -1000 + with pytest.raises(ValueError): + is_indexbox(box) + with pytest.raises(ValueError): + is_indexbox(box, errors="raise") + assert not is_indexbox(box, errors="ignore") + + def test_box_invalid_str(self): + for i in [4, 5]: + box = self.BOX3d + box[i] = "str" + with pytest.raises(ValueError): + is_indexbox(box) + with pytest.raises(ValueError): + is_indexbox(box, errors="raise") + assert not is_indexbox(box, errors="ignore") + + +def test_is_wmo(): + assert is_wmo(12345) + assert is_wmo([12345]) + assert is_wmo([12345, 1234567]) + + with pytest.raises(ValueError): + is_wmo(1234, errors="raise") + with pytest.raises(ValueError): + is_wmo(-1234, errors="raise") + with pytest.raises(ValueError): + is_wmo(1234.12, errors="raise") + with pytest.raises(ValueError): + is_wmo(12345.7, errors="raise") + + with pytest.warns(UserWarning): + is_wmo(1234, errors="warn") + with pytest.warns(UserWarning): + is_wmo(-1234, errors="warn") + with pytest.warns(UserWarning): + is_wmo(1234.12, errors="warn") + with pytest.warns(UserWarning): + is_wmo(12345.7, errors="warn") + + assert not is_wmo(12, errors="ignore") + assert not is_wmo(-12, errors="ignore") + assert not is_wmo(1234.12, errors="ignore") + assert not is_wmo(12345.7, errors="ignore") + + +def test_check_wmo(): + assert check_wmo(12345) == [12345] + assert check_wmo([1234567]) == [1234567] + assert check_wmo([12345, 1234567]) == [12345, 1234567] + assert check_wmo(np.array((12345, 1234567), dtype='int')) == [12345, 1234567] + + +def test_is_cyc(): + assert is_cyc(123) + assert is_cyc([123]) + assert is_cyc([12, 123, 1234]) + + with pytest.raises(ValueError): + is_cyc(12345, errors="raise") + with 
pytest.raises(ValueError): + is_cyc(-1234, errors="raise") + with pytest.raises(ValueError): + is_cyc(1234.12, errors="raise") + with pytest.raises(ValueError): + is_cyc(12345.7, errors="raise") + + with pytest.warns(UserWarning): + is_cyc(12345, errors="warn") + with pytest.warns(UserWarning): + is_cyc(-1234, errors="warn") + with pytest.warns(UserWarning): + is_cyc(1234.12, errors="warn") + with pytest.warns(UserWarning): + is_cyc(12345.7, errors="warn") + + assert not is_cyc(12345, errors="ignore") + assert not is_cyc(-12, errors="ignore") + assert not is_cyc(1234.12, errors="ignore") + assert not is_cyc(12345.7, errors="ignore") + + +def test_check_cyc(): + assert check_cyc(123) == [123] + assert check_cyc([12]) == [12] + assert check_cyc([12, 123]) == [12, 123] + assert check_cyc(np.array((123, 1234), dtype='int')) == [123, 1234] + diff --git a/argopy/utilities.py b/argopy/utilities.py index 396abe0b..955f3250 100644 --- a/argopy/utilities.py +++ b/argopy/utilities.py @@ -81,10 +81,6 @@ log = logging.getLogger("argopy.utilities") -with open(os.path.join(path2assets, "data_types.json"), "r") as f: - DATA_TYPES = json.load(f) - - def clear_cache(fs=None): """ Delete argopy cache folder content """ @@ -223,6 +219,7 @@ def load_dict(ptype): else: raise ValueError("Invalid dictionary name") + def mapp_dict(Adictionnary, Avalue): if Avalue not in Adictionnary: return "Unknown" @@ -230,202 +227,8 @@ def mapp_dict(Adictionnary, Avalue): return Adictionnary[Avalue] -def list_available_data_src(): - """ List all available data sources """ - sources = {} - try: - from .data_fetchers import erddap_data as Erddap_Fetchers - # Ensure we're loading the erddap data fetcher with the current options: - Erddap_Fetchers.api_server_check = Erddap_Fetchers.api_server_check.replace(Erddap_Fetchers.api_server, OPTIONS['erddap']) - Erddap_Fetchers.api_server = OPTIONS['erddap'] - - sources["erddap"] = Erddap_Fetchers - except Exception: - warnings.warn( - "An error occurred while loading the ERDDAP data fetcher, " - "it will not be available !\n%s\n%s" - % (sys.exc_info()[0], sys.exc_info()[1]) - ) - pass - - try: - from .data_fetchers import argovis_data as ArgoVis_Fetchers - - sources["argovis"] = ArgoVis_Fetchers - except Exception: - warnings.warn( - "An error occurred while loading the ArgoVis data fetcher, " - "it will not be available !\n%s\n%s" - % (sys.exc_info()[0], sys.exc_info()[1]) - ) - pass - - try: - from .data_fetchers import gdacftp_data as GDAC_Fetchers - # Ensure we're loading the gdac data fetcher with the current options: - GDAC_Fetchers.api_server_check = OPTIONS['ftp'] - GDAC_Fetchers.api_server = OPTIONS['ftp'] - - sources["gdac"] = GDAC_Fetchers - except Exception: - warnings.warn( - "An error occurred while loading the GDAC data fetcher, " - "it will not be available !\n%s\n%s" - % (sys.exc_info()[0], sys.exc_info()[1]) - ) - pass - - # return dict(sorted(sources.items())) - return sources - - -def list_available_index_src(): - """ List all available index sources """ - sources = {} - try: - from .data_fetchers import erddap_index as Erddap_Fetchers - # Ensure we're loading the erddap data fetcher with the current options: - Erddap_Fetchers.api_server_check = Erddap_Fetchers.api_server_check.replace(Erddap_Fetchers.api_server, OPTIONS['erddap']) - Erddap_Fetchers.api_server = OPTIONS['erddap'] - - sources["erddap"] = Erddap_Fetchers - except Exception: - warnings.warn( - "An error occurred while loading the ERDDAP index fetcher, " - "it will not be available !\n%s\n%s" - % 
(sys.exc_info()[0], sys.exc_info()[1]) - ) - pass - - try: - from .data_fetchers import gdacftp_index as GDAC_Fetchers - # Ensure we're loading the gdac data fetcher with the current options: - GDAC_Fetchers.api_server_check = OPTIONS['ftp'] - GDAC_Fetchers.api_server = OPTIONS['ftp'] - - sources["gdac"] = GDAC_Fetchers - except Exception: - warnings.warn( - "An error occurred while loading the GDAC index fetcher, " - "it will not be available !\n%s\n%s" - % (sys.exc_info()[0], sys.exc_info()[1]) - ) - pass - - return sources - - -def list_standard_variables(): - """ List of variables for standard users """ - return [ - "DATA_MODE", - "LATITUDE", - "LONGITUDE", - "POSITION_QC", - "DIRECTION", - "PLATFORM_NUMBER", - "CYCLE_NUMBER", - "PRES", - "TEMP", - "PSAL", - "PRES_QC", - "TEMP_QC", - "PSAL_QC", - "PRES_ADJUSTED", - "TEMP_ADJUSTED", - "PSAL_ADJUSTED", - "PRES_ADJUSTED_QC", - "TEMP_ADJUSTED_QC", - "PSAL_ADJUSTED_QC", - "PRES_ADJUSTED_ERROR", - "TEMP_ADJUSTED_ERROR", - "PSAL_ADJUSTED_ERROR", - "PRES_ERROR", # can be created from PRES_ADJUSTED_ERROR after a filter_data_mode - "TEMP_ERROR", - "PSAL_ERROR", - "JULD", - "JULD_QC", - "TIME", - "TIME_QC", - # "CONFIG_MISSION_NUMBER", - ] - - -def list_multiprofile_file_variables(): - """ List of variables in a netcdf multiprofile file. - - This is for files created by GDAC under //_prof.nc - """ - return [ - "CONFIG_MISSION_NUMBER", - "CYCLE_NUMBER", - "DATA_CENTRE", - "DATA_MODE", - "DATA_STATE_INDICATOR", - "DATA_TYPE", - "DATE_CREATION", - "DATE_UPDATE", - "DC_REFERENCE", - "DIRECTION", - "FIRMWARE_VERSION", - "FLOAT_SERIAL_NO", - "FORMAT_VERSION", - "HANDBOOK_VERSION", - "HISTORY_ACTION", - "HISTORY_DATE", - "HISTORY_INSTITUTION", - "HISTORY_PARAMETER", - "HISTORY_PREVIOUS_VALUE", - "HISTORY_QCTEST", - "HISTORY_REFERENCE", - "HISTORY_SOFTWARE", - "HISTORY_SOFTWARE_RELEASE", - "HISTORY_START_PRES", - "HISTORY_STEP", - "HISTORY_STOP_PRES", - "JULD", - "JULD_LOCATION", - "JULD_QC", - "LATITUDE", - "LONGITUDE", - "PARAMETER", - "PI_NAME", - "PLATFORM_NUMBER", - "PLATFORM_TYPE", - "POSITIONING_SYSTEM", - "POSITION_QC", - "PRES", - "PRES_ADJUSTED", - "PRES_ADJUSTED_ERROR", - "PRES_ADJUSTED_QC", - "PRES_QC", - "PROFILE_PRES_QC", - "PROFILE_PSAL_QC", - "PROFILE_TEMP_QC", - "PROJECT_NAME", - "PSAL", - "PSAL_ADJUSTED", - "PSAL_ADJUSTED_ERROR", - "PSAL_ADJUSTED_QC", - "PSAL_QC", - "REFERENCE_DATE_TIME", - "SCIENTIFIC_CALIB_COEFFICIENT", - "SCIENTIFIC_CALIB_COMMENT", - "SCIENTIFIC_CALIB_DATE", - "SCIENTIFIC_CALIB_EQUATION", - "STATION_PARAMETERS", - "TEMP", - "TEMP_ADJUSTED", - "TEMP_ADJUSTED_ERROR", - "TEMP_ADJUSTED_QC", - "TEMP_QC", - "VERTICAL_SAMPLING_SCHEME", - "WMO_INST_TYPE", - ] - - def get_sys_info(): - "Returns system information as a dict" + """Returns system information as a dict""" blob = [] @@ -625,94 +428,6 @@ def show_options(file=sys.stdout): # noqa: C901 print(f"{k}: {v}", file=file) -def check_gdac_path(path, errors='ignore'): # noqa: C901 - """ Check if a path has the expected GDAC ftp structure - - Expected GDAC ftp structure:: - - . - └── dac - ├── aoml - ├── ... - ├── coriolis - ├── ... 
- ├── meds - └── nmdis - - This check will return True if at least one DAC sub-folder is found under path/dac/ - - Examples:: - >>> check_gdac_path("https://data-argo.ifremer.fr") # True - >>> check_gdac_path("ftp://ftp.ifremer.fr/ifremer/argo") # True - >>> check_gdac_path("ftp://usgodae.org/pub/outgoing/argo") # True - >>> check_gdac_path("/home/ref-argo/gdac") # True - >>> check_gdac_path("https://www.ifremer.fr") # False - >>> check_gdac_path("ftp://usgodae.org/pub/outgoing") # False - - Parameters - ---------- - path: str - Path name to check, including access protocol - errors: str - "ignore" or "raise" (or "warn") - - Returns - ------- - checked: boolean - True if at least one DAC folder is found under path/dac/ - False otherwise - """ - # Create a file system for this path - if split_protocol(path)[0] is None: - fs = fsspec.filesystem('file') - elif 'https' in split_protocol(path)[0]: - fs = fsspec.filesystem('http') - elif 'ftp' in split_protocol(path)[0]: - try: - host = split_protocol(path)[-1].split('/')[0] - fs = fsspec.filesystem('ftp', host=host) - except gaierror: - if errors == 'raise': - raise FtpPathError("Can't get address info (GAIerror) on '%s'" % host) - elif errors == "warn": - warnings.warn("Can't get address info (GAIerror) on '%s'" % host) - return False - else: - return False - else: - raise FtpPathError("Unknown protocol for an Argo GDAC host: %s" % split_protocol(path)[0]) - - # dacs = [ - # "aoml", - # "bodc", - # "coriolis", - # "csio", - # "csiro", - # "incois", - # "jma", - # "kma", - # "kordi", - # "meds", - # "nmdis", - # ] - - # Case 1: - check1 = ( - fs.exists(path) - and fs.exists(fs.sep.join([path, "dac"])) - # and np.any([fs.exists(fs.sep.join([path, "dac", dac])) for dac in dacs]) # Take too much time on http/ftp GDAC server - ) - if check1: - return True - elif errors == "raise": - raise FtpPathError("This path is not GDAC compliant (no `dac` folder with legitimate sub-folder):\n%s" % path) - - elif errors == "warn": - warnings.warn("This path is not GDAC compliant:\n%s" % path) - return False - else: - return False - def isconnected(host: str = "https://www.ifremer.fr", maxtry: int = 10): """Check if an URL is alive @@ -1372,16 +1087,6 @@ def format_oneline(s, max_width=65): return s -def to_list(obj): - """Make sure that an expected list is indeed a list""" - if not isinstance(obj, list): - if isinstance(obj, np.ndarray): - obj = list(obj) - else: - obj = [obj] - return obj - - def warnUnless(ok, txt): """Function to raise a warning unless condition is True @@ -1843,157 +1548,6 @@ def fix_localhost(host): return dict(sorted(output.items())) -class DocInherit(object): - """Docstring inheriting method descriptor - - The class itself is also used as a decorator - - Usage: - - class Foo(object): - def foo(self): - "Frobber" - pass - - class Bar(Foo): - @doc_inherit - def foo(self): - pass - - Now, Bar.foo.__doc__ == Bar().foo.__doc__ == Foo.foo.__doc__ == "Frobber" - - src: https://code.activestate.com/recipes/576862/ - """ - - def __init__(self, mthd): - self.mthd = mthd - self.name = mthd.__name__ - - def __get__(self, obj, cls): - if obj: - return self.get_with_inst(obj, cls) - else: - return self.get_no_inst(cls) - - def get_with_inst(self, obj, cls): - - overridden = getattr(super(cls, obj), self.name, None) - - @wraps(self.mthd, assigned=('__name__', '__module__')) - def f(*args, **kwargs): - return self.mthd(obj, *args, **kwargs) - - return self.use_parent_doc(f, overridden) - - def get_no_inst(self, cls): - - for parent in cls.__mro__[1:]: - 
overridden = getattr(parent, self.name, None) - if overridden: - break - - @wraps(self.mthd, assigned=('__name__', '__module__')) - def f(*args, **kwargs): - return self.mthd(*args, **kwargs) - - return self.use_parent_doc(f, overridden) - - def use_parent_doc(self, func, source): - if source is None: - raise NameError("Can't find '%s' in parents" % self.name) - func.__doc__ = source.__doc__ - return func - - -doc_inherit = DocInherit - - -def deprecated(reason): - """Deprecation warning decorator. - - This is a decorator which can be used to mark functions - as deprecated. It will result in a warning being emitted - when the function is used. - - Parameters - ---------- - reason: {str, None} - Text message to send with deprecation warning - - Examples - -------- - The @deprecated can be used with a 'reason'. - - .. code-block:: python - - @deprecated("please, use another function") - def old_function(x, y): - pass - - or without: - - .. code-block:: python - - @deprecated - def old_function(x, y): - pass - - References - ---------- - https://stackoverflow.com/a/40301488 - """ - import inspect - - if isinstance(reason, str): - - def decorator(func1): - - if inspect.isclass(func1): - fmt1 = "Call to deprecated class {name} ({reason})." - else: - fmt1 = "Call to deprecated function {name} ({reason})." - - @wraps(func1) - def new_func1(*args, **kwargs): - warnings.simplefilter('always', DeprecationWarning) - warnings.warn( - fmt1.format(name=func1.__name__, reason=reason), - category=DeprecationWarning, - stacklevel=2 - ) - warnings.simplefilter('default', DeprecationWarning) - return func1(*args, **kwargs) - - return new_func1 - - return decorator - - elif inspect.isclass(reason) or inspect.isfunction(reason): - - func2 = reason - - if inspect.isclass(func2): - fmt2 = "Call to deprecated class {name}." - else: - fmt2 = "Call to deprecated function {name}." - - @wraps(func2) - def new_func2(*args, **kwargs): - warnings.simplefilter('always', DeprecationWarning) - warnings.warn( - fmt2.format(name=func2.__name__), - category=DeprecationWarning, - stacklevel=2 - ) - warnings.simplefilter('default', DeprecationWarning) - return func2(*args, **kwargs) - - return new_func2 - - else: - raise TypeError(repr(type(reason))) - - class RegistryItem(ABC): """Prototype for possible custom items in a Registry""" @property @@ -2246,456 +1800,6 @@ def copy(self): return self.__copy__() -def get_coriolis_profile_id(WMO, CYC=None, **kwargs): - """ Return a :class:`pandas.DataFrame` with CORIOLIS ID of WMO/CYC profile pairs - - This method get ID by requesting the dataselection.euro-argo.eu trajectory API. - - Parameters - ---------- - WMO: int, list(int) - Define the list of Argo floats. This is a list of integers with WMO float identifiers. - WMO is the World Meteorological Organization. - CYC: int, list(int) - Define the list of cycle numbers to load ID for each Argo floats listed in ``WMO``. 
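A minimal usage sketch for this fetcher, assuming the argopy.related import path introduced later in this series; the WMO and cycle values are illustrative (taken from the test suite) and the call needs network access to the euro-argo API:

from argopy.related import get_coriolis_profile_id

# Illustrative float / cycle selection, for demonstration only
df = get_coriolis_profile_id(6901929, CYC=12)
print(df[["PLATFORM_NUMBER", "CYCLE_NUMBER", "ID"]])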
- - Returns - ------- - :class:`pandas.DataFrame` - """ - WMO_list = check_wmo(WMO) - if CYC is not None: - CYC_list = check_cyc(CYC) - if 'api_server' in kwargs: - api_server = kwargs['api_server'] - elif OPTIONS['server'] is not None: - api_server = OPTIONS['server'] - else: - api_server = "https://dataselection.euro-argo.eu/api" - URIs = [api_server + "/trajectory/%i" % wmo for wmo in WMO_list] - - def prec(data, url): - # Transform trajectory json to dataframe - # See: https://dataselection.euro-argo.eu/swagger-ui.html#!/cycle-controller/getCyclesByPlatformCodeUsingGET - WMO = check_wmo(url.split("/")[-1])[0] - rows = [] - for profile in data: - keys = [x for x in profile.keys() if x not in ["coordinate"]] - meta_row = dict((key, profile[key]) for key in keys) - for row in profile["coordinate"]: - meta_row[row] = profile["coordinate"][row] - meta_row["WMO"] = WMO - rows.append(meta_row) - return pd.DataFrame(rows) - - from .stores import httpstore - fs = httpstore(cache=True, cachedir=OPTIONS['cachedir']) - data = fs.open_mfjson(URIs, preprocess=prec, errors="raise", url_follow=True) - - # Merge results (list of dataframe): - key_map = { - "id": "ID", - "lat": "LATITUDE", - "lon": "LONGITUDE", - "cvNumber": "CYCLE_NUMBER", - "level": "level", - "WMO": "PLATFORM_NUMBER", - } - for i, df in enumerate(data): - df = df.reset_index() - df = df.rename(columns=key_map) - df = df[[value for value in key_map.values() if value in df.columns]] - data[i] = df - df = pd.concat(data, ignore_index=True) - df.sort_values(by=["PLATFORM_NUMBER", "CYCLE_NUMBER"], inplace=True) - df = df.reset_index(drop=True) - # df = df.set_index(["PLATFORM_NUMBER", "CYCLE_NUMBER"]) - df = df.astype({"ID": int}) - if CYC is not None: - df = pd.concat([df[df["CYCLE_NUMBER"] == cyc] for cyc in CYC_list]).reset_index( - drop=True - ) - return df[ - ["PLATFORM_NUMBER", "CYCLE_NUMBER", "ID", "LATITUDE", "LONGITUDE", "level"] - ] - - -def get_ea_profile_page(WMO, CYC=None, **kwargs): - """ Return a list of URL - - Parameters - ---------- - WMO: int, list(int) - WMO must be an integer or an iterable with elements that can be casted as integers - CYC: int, list(int), default (None) - CYC must be an integer or an iterable with elements that can be casted as positive integers - - Returns - ------- - list(str) - - See also - -------- - get_coriolis_profile_id - """ - df = get_coriolis_profile_id(WMO, CYC, **kwargs) - url = "https://dataselection.euro-argo.eu/cycle/{}" - return [url.format(this_id) for this_id in sorted(df["ID"])] - - -@deprecated -def cast_types(ds): # noqa: C901 - """ Make sure variables are of the appropriate types according to Argo - - #todo: This is hard coded, but should be retrieved from an API somewhere. - Should be able to handle all possible variables encountered in the Argo dataset. 
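For context, the per-variable cast performed below reduces to an astype call on the DataArray values plus a "casted" flag; a rough standalone sketch with an illustrative, object-typed variable:

import numpy as np
import xarray as xr

# An object-typed cycle-number-like variable, purely for illustration
da = xr.DataArray(np.array(["1", "2", "3"], dtype=object), name="CYCLE_NUMBER")
da.values = da.values.astype(np.int32)  # cast in place, as cast_this() does
da.attrs["casted"] = 1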
- - Parameter - --------- - :class:`xarray.DataSet` - - Returns - ------- - :class:`xarray.DataSet` - """ - - list_str = [ - "PLATFORM_NUMBER", - "DATA_MODE", - "DIRECTION", - "DATA_CENTRE", - "DATA_TYPE", - "FORMAT_VERSION", - "HANDBOOK_VERSION", - "PROJECT_NAME", - "PI_NAME", - "STATION_PARAMETERS", - "DATA_CENTER", - "DC_REFERENCE", - "DATA_STATE_INDICATOR", - "PLATFORM_TYPE", - "FIRMWARE_VERSION", - "POSITIONING_SYSTEM", - "PROFILE_PRES_QC", - "PROFILE_PSAL_QC", - "PROFILE_TEMP_QC", - "PARAMETER", - "SCIENTIFIC_CALIB_EQUATION", - "SCIENTIFIC_CALIB_COEFFICIENT", - "SCIENTIFIC_CALIB_COMMENT", - "HISTORY_INSTITUTION", - "HISTORY_STEP", - "HISTORY_SOFTWARE", - "HISTORY_SOFTWARE_RELEASE", - "HISTORY_REFERENCE", - "HISTORY_QCTEST", - "HISTORY_ACTION", - "HISTORY_PARAMETER", - "VERTICAL_SAMPLING_SCHEME", - "FLOAT_SERIAL_NO", - "SOURCE", - "EXPOCODE", - "QCLEVEL", - ] - list_int = [ - "PLATFORM_NUMBER", - "WMO_INST_TYPE", - "WMO_INST_TYPE", - "CYCLE_NUMBER", - "CONFIG_MISSION_NUMBER", - ] - list_datetime = [ - "REFERENCE_DATE_TIME", - "DATE_CREATION", - "DATE_UPDATE", - "JULD", - "JULD_LOCATION", - "SCIENTIFIC_CALIB_DATE", - "HISTORY_DATE", - "TIME" - ] - - def fix_weird_bytes(x): - x = x.replace(b"\xb1", b"+/-") - return x - fix_weird_bytes = np.vectorize(fix_weird_bytes) - - def cast_this(da, type): - """ Low-level casting of DataArray values """ - try: - da.values = da.values.astype(type) - da.attrs["casted"] = 1 - except Exception: - msg = "Oops! %s occurred. Fail to cast <%s> into %s for: %s. Encountered unique values: %s" % (sys.exc_info()[0], str(da.dtype), type, da.name, str(np.unique(da))) - log.debug(msg) - return da - - def cast_this_da(da): - """ Cast any DataArray """ - v = da.name - da.attrs["casted"] = 0 - if v in list_str and da.dtype == "O": # Object - if v in ["SCIENTIFIC_CALIB_COEFFICIENT"]: - da.values = fix_weird_bytes(da.values) - da = cast_this(da, str) - - if v in list_int: # and da.dtype == 'O': # Object - da = cast_this(da, np.int32) - - if v in list_datetime and da.dtype == "O": # Object - if ( - "conventions" in da.attrs - and da.attrs["conventions"] == "YYYYMMDDHHMISS" - ): - if da.size != 0: - if len(da.dims) <= 1: - val = da.astype(str).values.astype("U14") - # This should not happen, but still ! That's real world data - val[val == " "] = "nan" - da.values = pd.to_datetime(val, format="%Y%m%d%H%M%S") - else: - s = da.stack(dummy_index=da.dims) - val = s.astype(str).values.astype("U14") - # This should not happen, but still ! 
That's real world data - val[val == ""] = "nan" - val[val == " "] = "nan" - # - s.values = pd.to_datetime(val, format="%Y%m%d%H%M%S") - da.values = s.unstack("dummy_index") - da = cast_this(da, 'datetime64[s]') - else: - da = cast_this(da, 'datetime64[s]') - - elif v == "SCIENTIFIC_CALIB_DATE": - da = cast_this(da, str) - s = da.stack(dummy_index=da.dims) - s.values = pd.to_datetime(s.values, format="%Y%m%d%H%M%S") - da.values = (s.unstack("dummy_index")).values - da = cast_this(da, 'datetime64[s]') - - if "QC" in v and "PROFILE" not in v and "QCTEST" not in v: - if da.dtype == "O": # convert object to string - da = cast_this(da, str) - - # Address weird string values: - # (replace missing or nan values by a '0' that will be cast as an integer later - - if da.dtype == " + + Examples:: + >>> check_gdac_path("https://data-argo.ifremer.fr") # True + >>> check_gdac_path("ftp://ftp.ifremer.fr/ifremer/argo") # True + >>> check_gdac_path("ftp://usgodae.org/pub/outgoing/argo") # True + >>> check_gdac_path("/home/ref-argo/gdac") # True + >>> check_gdac_path("https://www.ifremer.fr") # False + >>> check_gdac_path("ftp://usgodae.org/pub/outgoing") # False + + Parameters + ---------- + path: str + Path name to check, including access protocol + errors: str + "ignore" or "raise" (or "warn") + + Returns + ------- + checked: boolean + True if at least one DAC folder is found under path/dac/ + False otherwise + """ + # Create a file system for this path + if split_protocol(path)[0] is None: + fs = fsspec.filesystem('file') + elif 'https' in split_protocol(path)[0]: + fs = fsspec.filesystem('http') + elif 'ftp' in split_protocol(path)[0]: + try: + host = split_protocol(path)[-1].split('/')[0] + fs = fsspec.filesystem('ftp', host=host) + except gaierror: + if errors == 'raise': + raise FtpPathError("Can't get address info (GAIerror) on '%s'" % host) + elif errors == "warn": + warnings.warn("Can't get address info (GAIerror) on '%s'" % host) + return False + else: + return False + else: + raise FtpPathError("Unknown protocol for an Argo GDAC host: %s" % split_protocol(path)[0]) + + # dacs = [ + # "aoml", + # "bodc", + # "coriolis", + # "csio", + # "csiro", + # "incois", + # "jma", + # "kma", + # "kordi", + # "meds", + # "nmdis", + # ] + + # Case 1: + check1 = ( + fs.exists(path) + and fs.exists(fs.sep.join([path, "dac"])) + # and np.any([fs.exists(fs.sep.join([path, "dac", dac])) for dac in dacs]) # Take too much time on http/ftp GDAC server + ) + if check1: + return True + elif errors == "raise": + raise FtpPathError("This path is not GDAC compliant (no `dac` folder with legitimate sub-folder):\n%s" % path) + + elif errors == "warn": + warnings.warn("This path is not GDAC compliant:\n%s" % path) + return False + else: + return False + diff --git a/argopy/utils/decorators.py b/argopy/utils/decorators.py new file mode 100644 index 00000000..6cff7e56 --- /dev/null +++ b/argopy/utils/decorators.py @@ -0,0 +1,154 @@ +from functools import wraps +import warnings + + +class DocInherit(object): + """Docstring inheriting method descriptor + + The class itself is also used as a decorator + + Usage: + + class Foo(object): + def foo(self): + "Frobber" + pass + + class Bar(Foo): + @doc_inherit + def foo(self): + pass + + Now, Bar.foo.__doc__ == Bar().foo.__doc__ == Foo.foo.__doc__ == "Frobber" + + src: https://code.activestate.com/recipes/576862/ + """ + + def __init__(self, mthd): + self.mthd = mthd + self.name = mthd.__name__ + + def __get__(self, obj, cls): + if obj: + return self.get_with_inst(obj, cls) + else: + 
return self.get_no_inst(cls) + + def get_with_inst(self, obj, cls): + + overridden = getattr(super(cls, obj), self.name, None) + + @wraps(self.mthd, assigned=('__name__', '__module__')) + def f(*args, **kwargs): + return self.mthd(obj, *args, **kwargs) + + return self.use_parent_doc(f, overridden) + + def get_no_inst(self, cls): + + for parent in cls.__mro__[1:]: + overridden = getattr(parent, self.name, None) + if overridden: + break + + @wraps(self.mthd, assigned=('__name__', '__module__')) + def f(*args, **kwargs): + return self.mthd(*args, **kwargs) + + return self.use_parent_doc(f, overridden) + + def use_parent_doc(self, func, source): + if source is None: + raise NameError("Can't find '%s' in parents" % self.name) + func.__doc__ = source.__doc__ + return func + + +doc_inherit = DocInherit + + +def deprecated(reason): + """Deprecation warning decorator. + + This is a decorator which can be used to mark functions + as deprecated. It will result in a warning being emitted + when the function is used. + + Parameters + ---------- + reason: {str, None} + Text message to send with deprecation warning + + Examples + -------- + The @deprecated can be used with a 'reason'. + + .. code-block:: python + + @deprecated("please, use another function") + def old_function(x, y): + pass + + or without: + + .. code-block:: python + + @deprecated + def old_function(x, y): + pass + + References + ---------- + https://stackoverflow.com/a/40301488 + """ + import inspect + + if isinstance(reason, str): + + def decorator(func1): + + if inspect.isclass(func1): + fmt1 = "Call to deprecated class {name} ({reason})." + else: + fmt1 = "Call to deprecated function {name} ({reason})." + + @wraps(func1) + def new_func1(*args, **kwargs): + warnings.simplefilter('always', DeprecationWarning) + warnings.warn( + fmt1.format(name=func1.__name__, reason=reason), + category=DeprecationWarning, + stacklevel=2 + ) + warnings.simplefilter('default', DeprecationWarning) + return func1(*args, **kwargs) + + return new_func1 + + return decorator + + elif inspect.isclass(reason) or inspect.isfunction(reason): + + func2 = reason + + if inspect.isclass(func2): + fmt2 = "Call to deprecated class {name}." + else: + fmt2 = "Call to deprecated function {name}." 
+ + @wraps(func2) + def new_func2(*args, **kwargs): + warnings.simplefilter('always', DeprecationWarning) + warnings.warn( + fmt2.format(name=func2.__name__), + category=DeprecationWarning, + stacklevel=2 + ) + warnings.simplefilter('default', DeprecationWarning) + return func2(*args, **kwargs) + + return new_func2 + + else: + raise TypeError(repr(type(reason))) + diff --git a/argopy/utils/lists.py b/argopy/utils/lists.py new file mode 100644 index 00000000..78567313 --- /dev/null +++ b/argopy/utils/lists.py @@ -0,0 +1,198 @@ +import sys +import warnings +from ..options import OPTIONS + + +def list_available_data_src(): + """ List all available data sources """ + sources = {} + try: + from ..data_fetchers import erddap_data as Erddap_Fetchers + # Ensure we're loading the erddap data fetcher with the current options: + Erddap_Fetchers.api_server_check = Erddap_Fetchers.api_server_check.replace(Erddap_Fetchers.api_server, OPTIONS['erddap']) + Erddap_Fetchers.api_server = OPTIONS['erddap'] + + sources["erddap"] = Erddap_Fetchers + except Exception: + warnings.warn( + "An error occurred while loading the ERDDAP data fetcher, " + "it will not be available !\n%s\n%s" + % (sys.exc_info()[0], sys.exc_info()[1]) + ) + pass + + try: + from ..data_fetchers import argovis_data as ArgoVis_Fetchers + + sources["argovis"] = ArgoVis_Fetchers + except Exception: + warnings.warn( + "An error occurred while loading the ArgoVis data fetcher, " + "it will not be available !\n%s\n%s" + % (sys.exc_info()[0], sys.exc_info()[1]) + ) + pass + + try: + from ..data_fetchers import gdacftp_data as GDAC_Fetchers + # Ensure we're loading the gdac data fetcher with the current options: + GDAC_Fetchers.api_server_check = OPTIONS['ftp'] + GDAC_Fetchers.api_server = OPTIONS['ftp'] + + sources["gdac"] = GDAC_Fetchers + except Exception: + warnings.warn( + "An error occurred while loading the GDAC data fetcher, " + "it will not be available !\n%s\n%s" + % (sys.exc_info()[0], sys.exc_info()[1]) + ) + pass + + # return dict(sorted(sources.items())) + return sources + + +def list_available_index_src(): + """ List all available index sources """ + sources = {} + try: + from ..data_fetchers import erddap_index as Erddap_Fetchers + # Ensure we're loading the erddap data fetcher with the current options: + Erddap_Fetchers.api_server_check = Erddap_Fetchers.api_server_check.replace(Erddap_Fetchers.api_server, OPTIONS['erddap']) + Erddap_Fetchers.api_server = OPTIONS['erddap'] + + sources["erddap"] = Erddap_Fetchers + except Exception: + warnings.warn( + "An error occurred while loading the ERDDAP index fetcher, " + "it will not be available !\n%s\n%s" + % (sys.exc_info()[0], sys.exc_info()[1]) + ) + pass + + try: + from ..data_fetchers import gdacftp_index as GDAC_Fetchers + # Ensure we're loading the gdac data fetcher with the current options: + GDAC_Fetchers.api_server_check = OPTIONS['ftp'] + GDAC_Fetchers.api_server = OPTIONS['ftp'] + + sources["gdac"] = GDAC_Fetchers + except Exception: + warnings.warn( + "An error occurred while loading the GDAC index fetcher, " + "it will not be available !\n%s\n%s" + % (sys.exc_info()[0], sys.exc_info()[1]) + ) + pass + + return sources + + +def list_standard_variables(): + """ List of variables for standard users """ + return [ + "DATA_MODE", + "LATITUDE", + "LONGITUDE", + "POSITION_QC", + "DIRECTION", + "PLATFORM_NUMBER", + "CYCLE_NUMBER", + "PRES", + "TEMP", + "PSAL", + "PRES_QC", + "TEMP_QC", + "PSAL_QC", + "PRES_ADJUSTED", + "TEMP_ADJUSTED", + "PSAL_ADJUSTED", + "PRES_ADJUSTED_QC", + 
"TEMP_ADJUSTED_QC", + "PSAL_ADJUSTED_QC", + "PRES_ADJUSTED_ERROR", + "TEMP_ADJUSTED_ERROR", + "PSAL_ADJUSTED_ERROR", + "PRES_ERROR", # can be created from PRES_ADJUSTED_ERROR after a filter_data_mode + "TEMP_ERROR", + "PSAL_ERROR", + "JULD", + "JULD_QC", + "TIME", + "TIME_QC", + # "CONFIG_MISSION_NUMBER", + ] + + +def list_multiprofile_file_variables(): + """ List of variables in a netcdf multiprofile file. + + This is for files created by GDAC under //_prof.nc + """ + return [ + "CONFIG_MISSION_NUMBER", + "CYCLE_NUMBER", + "DATA_CENTRE", + "DATA_MODE", + "DATA_STATE_INDICATOR", + "DATA_TYPE", + "DATE_CREATION", + "DATE_UPDATE", + "DC_REFERENCE", + "DIRECTION", + "FIRMWARE_VERSION", + "FLOAT_SERIAL_NO", + "FORMAT_VERSION", + "HANDBOOK_VERSION", + "HISTORY_ACTION", + "HISTORY_DATE", + "HISTORY_INSTITUTION", + "HISTORY_PARAMETER", + "HISTORY_PREVIOUS_VALUE", + "HISTORY_QCTEST", + "HISTORY_REFERENCE", + "HISTORY_SOFTWARE", + "HISTORY_SOFTWARE_RELEASE", + "HISTORY_START_PRES", + "HISTORY_STEP", + "HISTORY_STOP_PRES", + "JULD", + "JULD_LOCATION", + "JULD_QC", + "LATITUDE", + "LONGITUDE", + "PARAMETER", + "PI_NAME", + "PLATFORM_NUMBER", + "PLATFORM_TYPE", + "POSITIONING_SYSTEM", + "POSITION_QC", + "PRES", + "PRES_ADJUSTED", + "PRES_ADJUSTED_ERROR", + "PRES_ADJUSTED_QC", + "PRES_QC", + "PROFILE_PRES_QC", + "PROFILE_PSAL_QC", + "PROFILE_TEMP_QC", + "PROJECT_NAME", + "PSAL", + "PSAL_ADJUSTED", + "PSAL_ADJUSTED_ERROR", + "PSAL_ADJUSTED_QC", + "PSAL_QC", + "REFERENCE_DATE_TIME", + "SCIENTIFIC_CALIB_COEFFICIENT", + "SCIENTIFIC_CALIB_COMMENT", + "SCIENTIFIC_CALIB_DATE", + "SCIENTIFIC_CALIB_EQUATION", + "STATION_PARAMETERS", + "TEMP", + "TEMP_ADJUSTED", + "TEMP_ADJUSTED_ERROR", + "TEMP_ADJUSTED_QC", + "TEMP_QC", + "VERTICAL_SAMPLING_SCHEME", + "WMO_INST_TYPE", + ] + diff --git a/argopy/xarray.py b/argopy/xarray.py index 87ceddef..1ccc8f99 100644 --- a/argopy/xarray.py +++ b/argopy/xarray.py @@ -14,16 +14,20 @@ except ModuleNotFoundError: with_gsw = False -from argopy.utilities import ( +from .utilities import ( linear_interpolation_remap, - is_list_of_strings, toYearFraction, groupby_remap, + # log_argopy_callerstack, +) + +from .utils import ( + is_list_of_strings, + # is_list_equal, cast_Argo_variable_type, DATA_TYPES, - # log_argopy_callerstack, ) -from argopy.errors import InvalidDatasetStructure, DataNotFound, OptionValueError +from .errors import InvalidDatasetStructure, DataNotFound, OptionValueError log = logging.getLogger("argopy.xarray") From 9ac43a2ff695467edeb3315314d33ee859e1e959 Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Fri, 8 Sep 2023 14:16:39 +0200 Subject: [PATCH 15/33] [skip-ci] --- argopy/data_fetchers/erddap_index.py | 7 +- argopy/data_fetchers/gdacftp_index.py | 15 --- argopy/related/__init__.py | 6 +- argopy/related/utils.py | 42 ++++++ argopy/stores/argo_index_proto.py | 2 +- argopy/tests/test_related.py | 15 ++- argopy/tests/test_utilities.py | 57 -------- argopy/tests/test_utils_checkers.py | 49 ++++++- argopy/tests/test_utils_lists.py | 7 + argopy/utilities.py | 181 -------------------------- argopy/utils/__init__.py | 3 + argopy/utils/checkers.py | 159 +++++++++++++++++++++- 12 files changed, 282 insertions(+), 261 deletions(-) create mode 100644 argopy/related/utils.py create mode 100644 argopy/tests/test_utils_lists.py diff --git a/argopy/data_fetchers/erddap_index.py b/argopy/data_fetchers/erddap_index.py index ebaff973..5cf84730 100644 --- a/argopy/data_fetchers/erddap_index.py +++ b/argopy/data_fetchers/erddap_index.py @@ -17,9 +17,10 @@ from abc import ABC, 
abstractmethod -from argopy.utilities import load_dict, mapp_dict, format_oneline -from argopy.stores import httpstore -from argopy.options import OPTIONS +from ..utilities import format_oneline +from ..related import load_dict, mapp_dict +from ..stores import httpstore +from ..options import OPTIONS log = logging.getLogger("argopy.fetchers.erddap_index") diff --git a/argopy/data_fetchers/gdacftp_index.py b/argopy/data_fetchers/gdacftp_index.py index c1a117d9..7b11f73d 100644 --- a/argopy/data_fetchers/gdacftp_index.py +++ b/argopy/data_fetchers/gdacftp_index.py @@ -161,21 +161,6 @@ def clear_cache(self): def to_dataframe(self): """ Filter index file and return a pandas dataframe """ df = self.indexfs.run().to_dataframe() - - # Post-processing of the filtered index is done at the indexstore level - # if 'wmo' not in df: - # df['wmo'] = df['file'].apply(lambda x: int(x.split('/')[1])) - # - # # institution & profiler mapping for all users - # # todo: may be we need to separate this for standard and expert users - # institution_dictionnary = load_dict('institutions') - # df['tmp1'] = df.institution.apply(lambda x: mapp_dict(institution_dictionnary, x)) - # df = df.rename(columns={"institution": "institution_code", "tmp1": "institution"}) - # - # profiler_dictionnary = load_dict('profilers') - # df['profiler'] = df.profiler_type.apply(lambda x: mapp_dict(profiler_dictionnary, int(x))) - # df = df.rename(columns={"profiler_type": "profiler_code"}) - return df def to_xarray(self): diff --git a/argopy/related/__init__.py b/argopy/related/__init__.py index 5c960c9d..68f16bd7 100644 --- a/argopy/related/__init__.py +++ b/argopy/related/__init__.py @@ -4,7 +4,7 @@ from .argo_documentation import ArgoDocs from .doi_snapshot import ArgoDOI from .euroargo_api import get_coriolis_profile_id, get_ea_profile_page - +from .utils import load_dict, mapp_dict # __all__ = ( @@ -18,4 +18,8 @@ # Functions: "get_coriolis_profile_id", "get_ea_profile_page", + + # Utilities: + "load_dict", + "mapp_dict", ) diff --git a/argopy/related/utils.py b/argopy/related/utils.py new file mode 100644 index 00000000..0463b102 --- /dev/null +++ b/argopy/related/utils.py @@ -0,0 +1,42 @@ +import importlib +import os +import json +from . 
import ArgoNVSReferenceTables + + +path2assets = importlib.util.find_spec('argopy.static.assets').submodule_search_locations[0] + + +def load_dict(ptype): + if ptype == "profilers": + try: + nvs = ArgoNVSReferenceTables(cache=True) + profilers = {} + for row in nvs.tbl(8).iterrows(): + profilers.update({int(row[1]['altLabel']): row[1]['prefLabel']}) + return profilers + except Exception: + with open(os.path.join(path2assets, "profilers.json"), "rb") as f: + loaded_dict = json.load(f)['data']['profilers'] + return loaded_dict + elif ptype == "institutions": + try: + nvs = ArgoNVSReferenceTables(cache=True) + institutions = {} + for row in nvs.tbl(4).iterrows(): + institutions.update({row[1]['altLabel']: row[1]['prefLabel']}) + return institutions + except Exception: + with open(os.path.join(path2assets, "institutions.json"), "rb") as f: + loaded_dict = json.load(f)['data']['institutions'] + return loaded_dict + else: + raise ValueError("Invalid dictionary name") + + +def mapp_dict(Adictionnary, Avalue): + if Avalue not in Adictionnary: + return "Unknown" + else: + return Adictionnary[Avalue] + diff --git a/argopy/stores/argo_index_proto.py b/argopy/stores/argo_index_proto.py index f7ed13d0..5a1f629a 100644 --- a/argopy/stores/argo_index_proto.py +++ b/argopy/stores/argo_index_proto.py @@ -505,7 +505,7 @@ def get_filename(s, index): else: log.debug("Converting [%s] to dataframe from scratch ..." % src) # Post-processing for user: - from argopy.utilities import load_dict, mapp_dict + from ..related import load_dict, mapp_dict if nrows is not None: df = df.loc[0: nrows - 1].copy() diff --git a/argopy/tests/test_related.py b/argopy/tests/test_related.py index 82f2028c..81d219d6 100644 --- a/argopy/tests/test_related.py +++ b/argopy/tests/test_related.py @@ -19,8 +19,9 @@ ArgoNVSReferenceTables, OceanOPSDeployments, ArgoDocs, + load_dict, mapp_dict ) -from argopy.utilities import ( +from argopy.utils.checkers import ( is_list_of_strings, ) @@ -301,3 +302,15 @@ def test_open_pdf(self, page, an_instance): else: with pytest.raises(ValueError): an_instance.show() + + + +def test_invalid_dictionnary(): + with pytest.raises(ValueError): + load_dict("invalid_dictionnary") + + +def test_invalid_dictionnary_key(): + d = load_dict("profilers") + assert mapp_dict(d, "invalid_key") == "Unknown" + diff --git a/argopy/tests/test_utilities.py b/argopy/tests/test_utilities.py index 4f691037..cecfb621 100644 --- a/argopy/tests/test_utilities.py +++ b/argopy/tests/test_utilities.py @@ -45,28 +45,6 @@ from mocked_http import mocked_httpserver, mocked_server_address -def test_invalid_dictionnary(): - with pytest.raises(ValueError): - load_dict("invalid_dictionnary") - - -def test_invalid_dictionnary_key(): - d = load_dict("profilers") - assert mapp_dict(d, "invalid_key") == "Unknown" - - -def test_list_multiprofile_file_variables(): - assert is_list_of_strings(list_multiprofile_file_variables()) - - -def test_check_gdac_path(): - assert check_gdac_path("dummy_path", errors='ignore') is False - with pytest.raises(FtpPathError): - check_gdac_path("dummy_path", errors='raise') - with pytest.warns(UserWarning): - assert check_gdac_path("dummy_path", errors='warn') is False - - @pytest.mark.parametrize("conda", [False, True], indirect=False, ids=["conda=%s" % str(p) for p in [False, True]]) @@ -76,41 +54,6 @@ def test_show_versions(conda): assert "SYSTEM" in f.getvalue() -def test_isconnected(mocked_httpserver): - assert isinstance(isconnected(host=mocked_server_address), bool) - assert 
isconnected(host="http://dummyhost") is False - - -def test_urlhaskeyword(mocked_httpserver): - url = "https://api.ifremer.fr/argopy/data/ARGO-FULL.json" - url.replace("https://api.ifremer.fr", mocked_server_address) - assert isinstance(urlhaskeyword(url, "label"), bool) - - -params = [mocked_server_address, - {"url": mocked_server_address + "/argopy/data/ARGO-FULL.json", "keyword": "label"} - ] -params_ids = ["url is a %s" % str(type(p)) for p in params] -@pytest.mark.parametrize("params", params, indirect=False, ids=params_ids) -def test_isalive(params, mocked_httpserver): - assert isinstance(isalive(params), bool) - - -@requires_erddap -@pytest.mark.parametrize("data", [True, False], indirect=False, ids=["data=%s" % t for t in [True, False]]) -def test_isAPIconnected(data, mocked_httpserver): - with argopy.set_options(erddap=mocked_server_address): - assert isinstance(isAPIconnected(src="erddap", data=data), bool) - - -def test_erddap_ds_exists(mocked_httpserver): - with argopy.set_options(erddap=mocked_server_address): - assert isinstance(erddap_ds_exists(ds="ArgoFloats"), bool) - assert erddap_ds_exists(ds="DummyDS") is False - -# todo : Implement tests for utilities functions: badge, fetch_status and monitor_status - - @requires_gdac def test_clear_cache(): ftproot, flist = argopy.tutorial.open_dataset("gdac") diff --git a/argopy/tests/test_utils_checkers.py b/argopy/tests/test_utils_checkers.py index 5ccc14af..987bd88a 100644 --- a/argopy/tests/test_utils_checkers.py +++ b/argopy/tests/test_utils_checkers.py @@ -1,10 +1,15 @@ import pytest import numpy as np +from mocked_http import mocked_httpserver, mocked_server_address -from argopy.utils import ( +import argopy +from argopy.errors import FtpPathError +from argopy.utils.checkers import ( is_box, is_indexbox, check_wmo, is_wmo, check_cyc, is_cyc, + check_gdac_path, + isconnected, urlhaskeyword, isAPIconnected, erddap_ds_exists, isalive ) @@ -177,3 +182,45 @@ def test_check_cyc(): assert check_cyc([12, 123]) == [12, 123] assert check_cyc(np.array((123, 1234), dtype='int')) == [123, 1234] + +def test_check_gdac_path(): + assert check_gdac_path("dummy_path", errors='ignore') is False + with pytest.raises(FtpPathError): + check_gdac_path("dummy_path", errors='raise') + with pytest.warns(UserWarning): + assert check_gdac_path("dummy_path", errors='warn') is False + + +def test_isconnected(mocked_httpserver): + assert isinstance(isconnected(host=mocked_server_address), bool) + assert isconnected(host="http://dummyhost") is False + + +def test_urlhaskeyword(mocked_httpserver): + url = "https://api.ifremer.fr/argopy/data/ARGO-FULL.json" + url.replace("https://api.ifremer.fr", mocked_server_address) + assert isinstance(urlhaskeyword(url, "label"), bool) + + +params = [mocked_server_address, + {"url": mocked_server_address + "/argopy/data/ARGO-FULL.json", "keyword": "label"} + ] +params_ids = ["url is a %s" % str(type(p)) for p in params] +@pytest.mark.parametrize("params", params, indirect=False, ids=params_ids) +def test_isalive(params, mocked_httpserver): + assert isinstance(isalive(params), bool) + + +@requires_erddap +@pytest.mark.parametrize("data", [True, False], indirect=False, ids=["data=%s" % t for t in [True, False]]) +def test_isAPIconnected(data, mocked_httpserver): + with argopy.set_options(erddap=mocked_server_address): + assert isinstance(isAPIconnected(src="erddap", data=data), bool) + + +def test_erddap_ds_exists(mocked_httpserver): + with argopy.set_options(erddap=mocked_server_address): + assert 
isinstance(erddap_ds_exists(ds="ArgoFloats"), bool) + assert erddap_ds_exists(ds="DummyDS") is False + +# todo : Implement tests for utilities functions: badge, fetch_status and monitor_status diff --git a/argopy/tests/test_utils_lists.py b/argopy/tests/test_utils_lists.py new file mode 100644 index 00000000..06aaa893 --- /dev/null +++ b/argopy/tests/test_utils_lists.py @@ -0,0 +1,7 @@ +# import pytest +from argopy.utils.checkers import is_list_of_strings +from argopy.utils.lists import list_multiprofile_file_variables + + +def test_list_multiprofile_file_variables(): + assert is_list_of_strings(list_multiprofile_file_variables()) diff --git a/argopy/utilities.py b/argopy/utilities.py index 955f3250..fd5e0479 100644 --- a/argopy/utilities.py +++ b/argopy/utilities.py @@ -193,40 +193,6 @@ def convert_size(size_bytes): return pd.DataFrame(listing) -def load_dict(ptype): - if ptype == "profilers": - try: - nvs = ArgoNVSReferenceTables(cache=True) - profilers = {} - for row in nvs.tbl(8).iterrows(): - profilers.update({int(row[1]['altLabel']): row[1]['prefLabel']}) - return profilers - except Exception: - with open(os.path.join(path2assets, "profilers.json"), "rb") as f: - loaded_dict = json.load(f)['data']['profilers'] - return loaded_dict - elif ptype == "institutions": - try: - nvs = ArgoNVSReferenceTables(cache=True) - institutions = {} - for row in nvs.tbl(4).iterrows(): - institutions.update({row[1]['altLabel']: row[1]['prefLabel']}) - return institutions - except Exception: - with open(os.path.join(path2assets, "institutions.json"), "rb") as f: - loaded_dict = json.load(f)['data']['institutions'] - return loaded_dict - else: - raise ValueError("Invalid dictionary name") - - -def mapp_dict(Adictionnary, Avalue): - if Avalue not in Adictionnary: - return "Unknown" - else: - return Adictionnary[Avalue] - - def get_sys_info(): """Returns system information as a dict""" @@ -428,153 +394,6 @@ def show_options(file=sys.stdout): # noqa: C901 print(f"{k}: {v}", file=file) - -def isconnected(host: str = "https://www.ifremer.fr", maxtry: int = 10): - """Check if an URL is alive - - Parameters - ---------- - host: str - URL to use, 'https://www.ifremer.fr' by default - maxtry: int, default: 10 - Maximum number of host connections to try before - - Returns - ------- - bool - """ - # log.debug("isconnected: %s" % host) - if split_protocol(host)[0] in ["http", "https", "ftp", "sftp"]: - it = 0 - while it < maxtry: - try: - # log.debug("Checking if %s is connected ..." % host) - urllib.request.urlopen(host, timeout=1) # nosec B310 because host protocol already checked - result, it = True, maxtry - except Exception: - result, it = False, it + 1 - return result - else: - return os.path.exists(host) - - -def urlhaskeyword(url: str = "", keyword: str = '', maxtry: int = 10): - """ Check if a keyword is in the content of a URL - - Parameters - ---------- - url: str - keyword: str - maxtry: int, default: 10 - Maximum number of host connections to try before returning False - - Returns - ------- - bool - """ - it = 0 - while it < maxtry: - try: - with fsspec.open(url) as f: - data = f.read() - result = keyword in str(data) - it = maxtry - except Exception: - result, it = False, it + 1 - return result - - -def isalive(api_server_check: Union[str, dict] = "") -> bool: - """Check if an API is alive or not - - 2 methods are available: - - - URL Ping - - keyword Check - - Parameters - ---------- - api_server_check - Url string or dictionary with [``url``, ``keyword``] keys. 
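Both accepted call forms, sketched with placeholder targets; the import path follows the move to argopy.utils.checkers made by this patch:

from argopy.utils.checkers import isalive

ok_ping = isalive("https://www.ifremer.fr")                                 # URL ping form
ok_word = isalive({"url": "https://www.ifremer.fr", "keyword": "Ifremer"})  # keyword-check form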
- - - For a string, uses: :class:`argopy.utilities.isconnected` - - For a dictionary, uses: :class:`argopy.utilities.urlhaskeyword` - - Returns - ------- - bool - """ - # log.debug("isalive: %s" % api_server_check) - if isinstance(api_server_check, dict): - return urlhaskeyword(url=api_server_check['url'], keyword=api_server_check['keyword']) - else: - return isconnected(api_server_check) - - -def isAPIconnected(src="erddap", data=True): - """ Check if a source API is alive or not - - The API is connected when it has a live URL or valid folder path. - - Parameters - ---------- - src: str - The data or index source name, 'erddap' default - data: bool - If True check the data fetcher (default), if False, check the index fetcher - - Returns - ------- - bool - """ - if data: - list_src = list_available_data_src() - else: - list_src = list_available_index_src() - - if src in list_src and getattr(list_src[src], "api_server_check", None): - return isalive(list_src[src].api_server_check) - else: - raise InvalidFetcher - - -def erddap_ds_exists( - ds: Union[list, str] = "ArgoFloats", - erddap: str = None, - maxtry: int = 2 -) -> bool: - """ Check if a dataset exists on a remote erddap server - - Parameter - --------- - ds: str, default='ArgoFloats' - Name of the erddap dataset to check - erddap: str, default=OPTIONS['erddap'] - Url of the erddap server - maxtry: int, default: 2 - Maximum number of host connections to try - - Return - ------ - bool - """ - if erddap is None: - erddap = OPTIONS['erddap'] - # log.debug("from erddap_ds_exists: %s" % erddap) - from .stores import httpstore - if isconnected(erddap, maxtry=maxtry): - with httpstore(timeout=OPTIONS['api_timeout']).open("".join([erddap, "/info/index.json"])) as of: - erddap_index = json.load(of) - if is_list_of_strings(ds): - return [this_ds in [row[-1] for row in erddap_index["table"]["rows"]] for this_ds in ds] - else: - return ds in [row[-1] for row in erddap_index["table"]["rows"]] - else: - log.debug("Cannot reach erddap server: %s" % erddap) - warnings.warn("Return False because we cannot reach the erddap server %s" % erddap) - return False - - def badge(label="label", message="message", color="green", insert=False): """ Return or insert shield.io badge image diff --git a/argopy/utils/__init__.py b/argopy/utils/__init__.py index acdfe1ce..8acfbd69 100644 --- a/argopy/utils/__init__.py +++ b/argopy/utils/__init__.py @@ -6,6 +6,8 @@ is_cyc, check_cyc, check_index_cols, check_gdac_path, + isconnected, urlhaskeyword, + isalive, isAPIconnected, erddap_ds_exists, ) from .casting import DATA_TYPES, cast_Argo_variable_type, to_list from .decorators import deprecated, doc_inherit @@ -29,6 +31,7 @@ "is_cyc", "check_cyc", "check_index_cols", "check_gdac_path", + "isconnected", "isalive", "isAPIconnected", "erddap_ds_exists", # Data type casting: "DATA_TYPES", diff --git a/argopy/utils/checkers.py b/argopy/utils/checkers.py index 2c8cfb53..b3f2f977 100644 --- a/argopy/utils/checkers.py +++ b/argopy/utils/checkers.py @@ -1,12 +1,24 @@ +import os import warnings import numpy as np import pandas as pd import xarray as xr +from typing import Union from fsspec.core import split_protocol import fsspec from socket import gaierror +import urllib +import json +import logging + +from ..options import OPTIONS +from ..stores import httpstore from ..utils import to_list -from ..errors import InvalidDatasetStructure, FtpPathError +from ..errors import InvalidDatasetStructure, FtpPathError, InvalidFetcher +from . 
import list_available_data_src, list_available_index_src + + +log = logging.getLogger("argopy.utils.checkers") def is_indexbox(box: list, errors="raise"): @@ -468,3 +480,148 @@ def check_gdac_path(path, errors='ignore'): # noqa: C901 else: return False + +def isconnected(host: str = "https://www.ifremer.fr", maxtry: int = 10): + """Check if an URL is alive + + Parameters + ---------- + host: str + URL to use, 'https://www.ifremer.fr' by default + maxtry: int, default: 10 + Maximum number of host connections to try before + + Returns + ------- + bool + """ + # log.debug("isconnected: %s" % host) + if split_protocol(host)[0] in ["http", "https", "ftp", "sftp"]: + it = 0 + while it < maxtry: + try: + # log.debug("Checking if %s is connected ..." % host) + urllib.request.urlopen(host, timeout=1) # nosec B310 because host protocol already checked + result, it = True, maxtry + except Exception: + result, it = False, it + 1 + return result + else: + return os.path.exists(host) + + +def urlhaskeyword(url: str = "", keyword: str = '', maxtry: int = 10): + """ Check if a keyword is in the content of a URL + + Parameters + ---------- + url: str + keyword: str + maxtry: int, default: 10 + Maximum number of host connections to try before returning False + + Returns + ------- + bool + """ + it = 0 + while it < maxtry: + try: + with fsspec.open(url) as f: + data = f.read() + result = keyword in str(data) + it = maxtry + except Exception: + result, it = False, it + 1 + return result + + +def isalive(api_server_check: Union[str, dict] = "") -> bool: + """Check if an API is alive or not + + 2 methods are available: + + - URL Ping + - keyword Check + + Parameters + ---------- + api_server_check + Url string or dictionary with [``url``, ``keyword``] keys. + + - For a string, uses: :class:`argopy.utilities.isconnected` + - For a dictionary, uses: :class:`argopy.utilities.urlhaskeyword` + + Returns + ------- + bool + """ + # log.debug("isalive: %s" % api_server_check) + if isinstance(api_server_check, dict): + return urlhaskeyword(url=api_server_check['url'], keyword=api_server_check['keyword']) + else: + return isconnected(api_server_check) + + +def isAPIconnected(src="erddap", data=True): + """ Check if a source API is alive or not + + The API is connected when it has a live URL or valid folder path. 
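A short sketch of the intended use, assuming the erddap source is registered and reachable from the running environment; an unknown source name raises InvalidFetcher:

from argopy.utils.checkers import isAPIconnected

if isAPIconnected(src="erddap", data=True):  # data=False would check the index fetcher instead
    print("erddap data fetcher is reachable")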
+ + Parameters + ---------- + src: str + The data or index source name, 'erddap' default + data: bool + If True check the data fetcher (default), if False, check the index fetcher + + Returns + ------- + bool + """ + if data: + list_src = list_available_data_src() + else: + list_src = list_available_index_src() + + if src in list_src and getattr(list_src[src], "api_server_check", None): + return isalive(list_src[src].api_server_check) + else: + raise InvalidFetcher + + +def erddap_ds_exists( + ds: Union[list, str] = "ArgoFloats", + erddap: str = None, + maxtry: int = 2 +) -> bool: + """ Check if a dataset exists on a remote erddap server + + Parameter + --------- + ds: str, default='ArgoFloats' + Name of the erddap dataset to check + erddap: str, default=OPTIONS['erddap'] + Url of the erddap server + maxtry: int, default: 2 + Maximum number of host connections to try + + Return + ------ + bool + """ + if erddap is None: + erddap = OPTIONS['erddap'] + # log.debug("from erddap_ds_exists: %s" % erddap) + if isconnected(erddap, maxtry=maxtry): + with httpstore(timeout=OPTIONS['api_timeout']).open("".join([erddap, "/info/index.json"])) as of: + erddap_index = json.load(of) + if is_list_of_strings(ds): + return [this_ds in [row[-1] for row in erddap_index["table"]["rows"]] for this_ds in ds] + else: + return ds in [row[-1] for row in erddap_index["table"]["rows"]] + else: + log.debug("Cannot reach erddap server: %s" % erddap) + warnings.warn("Return False because we cannot reach the erddap server %s" % erddap) + return False + From 33d242388cc0b55b6c77cfd1a2263609b4cc6fa5 Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Fri, 8 Sep 2023 15:20:45 +0200 Subject: [PATCH 16/33] [skip-ci] --- argopy/data_fetchers/argovis_data.py | 11 +- argopy/data_fetchers/erddap_data.py | 7 +- argopy/data_fetchers/erddap_refdata.py | 8 +- argopy/data_fetchers/gdacftp_data.py | 2 +- argopy/data_fetchers/proto.py | 2 +- argopy/stores/argo_index_proto.py | 2 +- argopy/stores/filesystems.py | 3 +- argopy/tests/test_related.py | 15 +- argopy/tests/test_utilities.py | 316 ------------ argopy/tests/test_utils_accessories.py | 86 ++++ argopy/tests/test_utils_caching.py | 35 ++ argopy/tests/test_utils_checkers.py | 6 +- argopy/tests/test_utils_chunking.py | 196 ++++++++ argopy/utilities.py | 635 ------------------------- argopy/utils/__init__.py | 19 +- argopy/utils/accessories.py | 262 ++++++++++ argopy/utils/caching.py | 122 +++++ argopy/utils/chunking.py | 282 +++++++++++ 18 files changed, 1031 insertions(+), 978 deletions(-) create mode 100644 argopy/tests/test_utils_accessories.py create mode 100644 argopy/tests/test_utils_caching.py create mode 100644 argopy/tests/test_utils_chunking.py create mode 100644 argopy/utils/accessories.py create mode 100644 argopy/utils/caching.py create mode 100644 argopy/utils/chunking.py diff --git a/argopy/data_fetchers/argovis_data.py b/argopy/data_fetchers/argovis_data.py index 8bab0bca..f57a22c7 100644 --- a/argopy/data_fetchers/argovis_data.py +++ b/argopy/data_fetchers/argovis_data.py @@ -9,14 +9,15 @@ import xarray as xr import getpass import logging -from .proto import ArgoDataFetcherProto from abc import abstractmethod import warnings -from argopy.stores import httpstore -from argopy.options import OPTIONS -from argopy.utilities import format_oneline, Chunker -from argopy.errors import DataNotFound +from ..stores import httpstore +from ..options import OPTIONS +from ..utilities import format_oneline +from ..utils import Chunker +from ..errors import DataNotFound +from .proto 
import ArgoDataFetcherProto access_points = ["wmo", "box"] diff --git a/argopy/data_fetchers/erddap_data.py b/argopy/data_fetchers/erddap_data.py index c3d3ea58..e817f087 100644 --- a/argopy/data_fetchers/erddap_data.py +++ b/argopy/data_fetchers/erddap_data.py @@ -24,13 +24,14 @@ from aiohttp import ClientResponseError import logging -from .proto import ArgoDataFetcherProto from ..options import OPTIONS -from ..utilities import Chunker, format_oneline +from ..utilities import format_oneline from ..stores import httpstore from ..errors import ErddapServerError, DataNotFound from ..stores import indexstore_pd as ArgoIndex # make sure we work with the Pandas index store -from ..utils import is_list_of_strings, to_list +from ..utils import is_list_of_strings, to_list,Chunker +from .proto import ArgoDataFetcherProto + # Load erddapy according to available version (breaking changes in v0.8.0) try: diff --git a/argopy/data_fetchers/erddap_refdata.py b/argopy/data_fetchers/erddap_refdata.py index fc0c216a..1b07bf4e 100644 --- a/argopy/data_fetchers/erddap_refdata.py +++ b/argopy/data_fetchers/erddap_refdata.py @@ -2,11 +2,11 @@ Fetcher to retrieve CTD reference data from Ifremer erddap """ import xarray as xr -from .erddap_data import ErddapArgoDataFetcher -from argopy.options import OPTIONS -from argopy.utilities import Chunker -from argopy.stores import httpstore_erddap_auth import logging +from ..options import OPTIONS +from ..utils import Chunker +from ..stores import httpstore_erddap_auth +from .erddap_data import ErddapArgoDataFetcher # Load erddapy according to available version (breaking changes in v0.8.0) try: diff --git a/argopy/data_fetchers/gdacftp_data.py b/argopy/data_fetchers/gdacftp_data.py index 631d31d2..d6ee4599 100644 --- a/argopy/data_fetchers/gdacftp_data.py +++ b/argopy/data_fetchers/gdacftp_data.py @@ -12,11 +12,11 @@ import getpass import logging -from .proto import ArgoDataFetcherProto from ..utilities import format_oneline, argo_split_path from ..options import OPTIONS, check_gdac_path from ..errors import DataNotFound from ..stores import ArgoIndex +from .proto import ArgoDataFetcherProto log = logging.getLogger("argopy.gdacftp.data") access_points = ["wmo", "box"] diff --git a/argopy/data_fetchers/proto.py b/argopy/data_fetchers/proto.py index 28452de5..a3f0ded1 100644 --- a/argopy/data_fetchers/proto.py +++ b/argopy/data_fetchers/proto.py @@ -5,7 +5,7 @@ import hashlib import warnings from ..plot import dashboard -from ..utilities import list_standard_variables +from ..utils import list_standard_variables class ArgoDataFetcherProto(ABC): diff --git a/argopy/stores/argo_index_proto.py b/argopy/stores/argo_index_proto.py index 5a1f629a..48e82180 100644 --- a/argopy/stores/argo_index_proto.py +++ b/argopy/stores/argo_index_proto.py @@ -13,7 +13,7 @@ from ..options import OPTIONS from ..errors import FtpPathError, InvalidDataset, OptionValueError -from ..utilities import Registry, isconnected +from ..utils import Registry, isconnected from .filesystems import httpstore, memorystore, filestore, ftpstore try: diff --git a/argopy/stores/filesystems.py b/argopy/stores/filesystems.py index 3e08cd3d..42517f93 100644 --- a/argopy/stores/filesystems.py +++ b/argopy/stores/filesystems.py @@ -49,12 +49,11 @@ ) from abc import ABC, abstractmethod from ..utilities import ( - Registry, - # log_argopy_callerstack, drop_variables_not_in_all_datasets, fill_variables_not_in_all_datasets, ) from ..utils import MonitoredThreadPoolExecutor as MyExecutor +from ..utils import Registry log = 
logging.getLogger("argopy.stores") diff --git a/argopy/tests/test_related.py b/argopy/tests/test_related.py index 81d219d6..031d2710 100644 --- a/argopy/tests/test_related.py +++ b/argopy/tests/test_related.py @@ -14,12 +14,14 @@ has_cartopy, has_ipython, ) +import argopy from argopy.related import ( TopoFetcher, ArgoNVSReferenceTables, OceanOPSDeployments, ArgoDocs, - load_dict, mapp_dict + load_dict, mapp_dict, + get_coriolis_profile_id, get_ea_profile_page ) from argopy.utils.checkers import ( is_list_of_strings, @@ -304,7 +306,6 @@ def test_open_pdf(self, page, an_instance): an_instance.show() - def test_invalid_dictionnary(): with pytest.raises(ValueError): load_dict("invalid_dictionnary") @@ -314,3 +315,13 @@ def test_invalid_dictionnary_key(): d = load_dict("profilers") assert mapp_dict(d, "invalid_key") == "Unknown" + +@pytest.mark.parametrize("params", [[6901929, None], [6901929, 12]], indirect=False, ids=['float', 'profile']) +def test_get_coriolis_profile_id(params, mocked_httpserver): + with argopy.set_options(cachedir=tempfile.mkdtemp()): + assert isinstance(get_coriolis_profile_id(params[0], params[1], api_server=mocked_server_address), pd.core.frame.DataFrame) + +@pytest.mark.parametrize("params", [[6901929, None], [6901929, 12]], indirect=False, ids=['float', 'profile']) +def test_get_ea_profile_page(params, mocked_httpserver): + with argopy.set_options(cachedir=tempfile.mkdtemp()): + assert is_list_of_strings(get_ea_profile_page(params[0], params[1], api_server=mocked_server_address)) diff --git a/argopy/tests/test_utilities.py b/argopy/tests/test_utilities.py index cecfb621..8ccd8d46 100644 --- a/argopy/tests/test_utilities.py +++ b/argopy/tests/test_utilities.py @@ -9,17 +9,7 @@ import argopy from argopy.utilities import ( - load_dict, - mapp_dict, - list_multiprofile_file_variables, - check_gdac_path, - isconnected, - urlhaskeyword, - isalive, - isAPIconnected, - erddap_ds_exists, linear_interpolation_remap, - Chunker, format_oneline, wmo2box, modified_environ, @@ -54,33 +44,6 @@ def test_show_versions(conda): assert "SYSTEM" in f.getvalue() -@requires_gdac -def test_clear_cache(): - ftproot, flist = argopy.tutorial.open_dataset("gdac") - with tempfile.TemporaryDirectory() as cachedir: - with argopy.set_options(cachedir=cachedir): - loader = ArgoDataFetcher(src="gdac", ftp=ftproot, cache=True).profile(2902696, 12) - loader.to_xarray() - argopy.clear_cache() - assert os.path.exists(cachedir) is True - assert len(os.listdir(cachedir)) == 0 - - -@requires_gdac -def test_lscache(): - ftproot, flist = argopy.tutorial.open_dataset("gdac") - with tempfile.TemporaryDirectory() as cachedir: - with argopy.set_options(cachedir=cachedir): - loader = ArgoDataFetcher(src="gdac", ftp=ftproot, cache=True).profile(2902696, 12) - loader.to_xarray() - result = argopy.utilities.lscache(cache_path=cachedir, prt=True) - assert isinstance(result, str) - - result = argopy.utilities.lscache(cache_path=cachedir, prt=False) - assert isinstance(result, pd.DataFrame) - - - class Test_linear_interpolation_remap: @pytest.fixture(autouse=True) def create_data(self): @@ -150,193 +113,6 @@ def test_error_ds(self): ) -class Test_Chunker: - @pytest.fixture(autouse=True) - def create_data(self): - self.WMO = [ - 6902766, - 6902772, - 6902914, - 6902746, - 6902916, - 6902915, - 6902757, - 6902771, - ] - self.BOX3d = [0, 20, 40, 60, 0, 1000] - self.BOX4d = [0, 20, 40, 60, 0, 1000, "2001-01", "2001-6"] - - def test_InvalidFetcherAccessPoint(self): - with pytest.raises(InvalidFetcherAccessPoint): - 
Chunker({"invalid": self.WMO}) - - def test_invalid_chunks(self): - with pytest.raises(ValueError): - Chunker({"box": self.BOX3d}, chunks='toto') - - def test_invalid_chunksize(self): - with pytest.raises(ValueError): - Chunker({"box": self.BOX3d}, chunksize='toto') - - def test_chunk_wmo(self): - C = Chunker({"wmo": self.WMO}) - assert all( - [all(isinstance(x, int) for x in chunk) for chunk in C.fit_transform()] - ) - - C = Chunker({"wmo": self.WMO}, chunks="auto") - assert all( - [all(isinstance(x, int) for x in chunk) for chunk in C.fit_transform()] - ) - - C = Chunker({"wmo": self.WMO}, chunks={"wmo": 1}) - assert all( - [all(isinstance(x, int) for x in chunk) for chunk in C.fit_transform()] - ) - assert len(C.fit_transform()) == 1 - - with pytest.raises(ValueError): - Chunker({"wmo": self.WMO}, chunks=["wmo", 1]) - - C = Chunker({"wmo": self.WMO}) - assert isinstance(C.this_chunker, types.FunctionType) or isinstance( - C.this_chunker, types.MethodType - ) - - def test_chunk_box3d(self): - C = Chunker({"box": self.BOX3d}) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - - C = Chunker({"box": self.BOX3d}, chunks="auto") - assert all([is_box(chunk) for chunk in C.fit_transform()]) - - C = Chunker({"box": self.BOX3d}, chunks={"lon": 12, "lat": 1, "dpt": 1}) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - assert len(C.fit_transform()) == 12 - - C = Chunker( - {"box": self.BOX3d}, chunks={"lat": 1, "dpt": 1}, chunksize={"lon": 10} - ) - chunks = C.fit_transform() - assert all([is_box(chunk) for chunk in chunks]) - assert chunks[0][1] - chunks[0][0] == 10 - - C = Chunker({"box": self.BOX3d}, chunks={"lon": 1, "lat": 12, "dpt": 1}) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - assert len(C.fit_transform()) == 12 - - C = Chunker( - {"box": self.BOX3d}, chunks={"lon": 1, "dpt": 1}, chunksize={"lat": 10} - ) - chunks = C.fit_transform() - assert all([is_box(chunk) for chunk in chunks]) - assert chunks[0][3] - chunks[0][2] == 10 - - C = Chunker({"box": self.BOX3d}, chunks={"lon": 1, "lat": 1, "dpt": 12}) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - assert len(C.fit_transform()) == 12 - - C = Chunker( - {"box": self.BOX3d}, chunks={"lon": 1, "lat": 1}, chunksize={"dpt": 10} - ) - chunks = C.fit_transform() - assert all([is_box(chunk) for chunk in chunks]) - assert chunks[0][5] - chunks[0][4] == 10 - - C = Chunker({"box": self.BOX3d}, chunks={"lon": 4, "lat": 2, "dpt": 1}) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - assert len(C.fit_transform()) == 2 * 4 - - C = Chunker({"box": self.BOX3d}, chunks={"lon": 2, "lat": 3, "dpt": 4}) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - assert len(C.fit_transform()) == 2 * 3 * 4 - - with pytest.raises(ValueError): - Chunker({"box": self.BOX3d}, chunks=["lon", 1]) - - C = Chunker({"box": self.BOX3d}) - assert isinstance(C.this_chunker, types.FunctionType) or isinstance( - C.this_chunker, types.MethodType - ) - - def test_chunk_box4d(self): - C = Chunker({"box": self.BOX4d}) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - - C = Chunker({"box": self.BOX4d}, chunks="auto") - assert all([is_box(chunk) for chunk in C.fit_transform()]) - - C = Chunker( - {"box": self.BOX4d}, chunks={"lon": 2, "lat": 1, "dpt": 1, "time": 1} - ) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - assert len(C.fit_transform()) == 2 - - C = Chunker( - {"box": self.BOX4d}, - chunks={"lat": 1, "dpt": 1, "time": 1}, - chunksize={"lon": 10}, - ) - chunks = 
C.fit_transform() - assert all([is_box(chunk) for chunk in chunks]) - assert chunks[0][1] - chunks[0][0] == 10 - - C = Chunker( - {"box": self.BOX4d}, chunks={"lon": 1, "lat": 2, "dpt": 1, "time": 1} - ) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - assert len(C.fit_transform()) == 2 - - C = Chunker( - {"box": self.BOX4d}, - chunks={"lon": 1, "dpt": 1, "time": 1}, - chunksize={"lat": 10}, - ) - chunks = C.fit_transform() - assert all([is_box(chunk) for chunk in chunks]) - assert chunks[0][3] - chunks[0][2] == 10 - - C = Chunker( - {"box": self.BOX4d}, chunks={"lon": 1, "lat": 1, "dpt": 2, "time": 1} - ) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - assert len(C.fit_transform()) == 2 - - C = Chunker( - {"box": self.BOX4d}, - chunks={"lon": 1, "lat": 1, "time": 1}, - chunksize={"dpt": 10}, - ) - chunks = C.fit_transform() - assert all([is_box(chunk) for chunk in chunks]) - assert chunks[0][5] - chunks[0][4] == 10 - - C = Chunker( - {"box": self.BOX4d}, chunks={"lon": 1, "lat": 1, "dpt": 1, "time": 2} - ) - assert all([is_box(chunk) for chunk in C.fit_transform()]) - assert len(C.fit_transform()) == 2 - - C = Chunker( - {"box": self.BOX4d}, - chunks={"lon": 1, "lat": 1, "dpt": 1}, - chunksize={"time": 5}, - ) - chunks = C.fit_transform() - assert all([is_box(chunk) for chunk in chunks]) - assert np.timedelta64( - pd.to_datetime(chunks[0][7]) - pd.to_datetime(chunks[0][6]), "D" - ) <= np.timedelta64(5, "D") - - with pytest.raises(ValueError): - Chunker({"box": self.BOX4d}, chunks=["lon", 1]) - - C = Chunker({"box": self.BOX4d}) - assert isinstance(C.this_chunker, types.FunctionType) or isinstance( - C.this_chunker, types.MethodType - ) - - def test_format_oneline(): s = "Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore" assert isinstance(format_oneline(s), str) @@ -438,95 +214,3 @@ def test_argo_split_path(self, file): assert key in desc -class Test_float_wmo(): - - def test_init(self): - assert isinstance(float_wmo(2901746), float_wmo) - assert isinstance(float_wmo(float_wmo(2901746)), float_wmo) - - def test_isvalid(self): - assert float_wmo(2901746).isvalid - assert not float_wmo(12, errors='ignore').isvalid - - def test_ppt(self): - assert isinstance(str(float_wmo(2901746)), str) - assert isinstance(repr(float_wmo(2901746)), str) - - def test_comparisons(self): - assert float_wmo(2901746) == float_wmo(2901746) - assert float_wmo(2901746) != float_wmo(2901745) - assert float_wmo(2901746) >= float_wmo(2901746) - assert float_wmo(2901746) > float_wmo(2901745) - assert float_wmo(2901746) <= float_wmo(2901746) - assert float_wmo(2901746) < float_wmo(2901747) - - def test_hashable(self): - assert isinstance(hash(float_wmo(2901746)), int) - - -class Test_Registry(): - - opts = [(None, 'str'), (['hello', 'world'], str), (None, float_wmo), ([2901746, 4902252], float_wmo)] - opts_ids = ["%s, %s" % ((lambda x: 'iterlist' if x is not None else x)(opt[0]), repr(opt[1])) for opt in opts] - - @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids) - def test_init(self, opts): - assert isinstance(Registry(opts[0], dtype=opts[1]), Registry) - - opts = [(['hello', 'world'], str), ([2901746, 4902252], float_wmo)] - opts_ids = ["%s, %s" % ((lambda x: 'iterlist' if x is not None else x)(opt[0]), repr(opt[1])) for opt in opts] - - @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids) - def test_commit(self, opts): - R = Registry(dtype=opts[1]) - R.commit(opts[0]) - - 
@pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids) - def test_append(self, opts): - R = Registry(dtype=opts[1]) - R.append(opts[0][0]) - - @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids) - def test_extend(self, opts): - R = Registry(dtype=opts[1]) - R.append(opts[0]) - - @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids) - def test_insert(self, opts): - R = Registry(opts[0][0], dtype=opts[1]) - R.insert(0, opts[0][-1]) - assert R[0] == opts[0][-1] - - @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids) - def test_remove(self, opts): - R = Registry(opts[0], dtype=opts[1]) - R.remove(opts[0][0]) - assert opts[0][0] not in R - - @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids) - def test_copy(self, opts): - R = Registry(opts[0], dtype=opts[1]) - assert R == R.copy() - - bad_opts = [(['hello', 12], str), ([2901746, 1], float_wmo)] - bad_opts_ids = ["%s, %s" % ((lambda x: 'iterlist' if x is not None else x)(opt[0]), repr(opt[1])) for opt in opts] - - @pytest.mark.parametrize("opts", bad_opts, indirect=False, ids=bad_opts_ids) - def test_invalid_dtype(self, opts): - with pytest.raises(ValueError): - Registry(opts[0][0], dtype=opts[1], invalid='raise').commit(opts[0][-1]) - with pytest.warns(UserWarning): - Registry(opts[0][0], dtype=opts[1], invalid='warn').commit(opts[0][-1]) - # Raise nothing: - Registry(opts[0][0], dtype=opts[1], invalid='ignore').commit(opts[0][-1]) - - -@pytest.mark.parametrize("params", [[6901929, None], [6901929, 12]], indirect=False, ids=['float', 'profile']) -def test_get_coriolis_profile_id(params, mocked_httpserver): - with argopy.set_options(cachedir=tempfile.mkdtemp()): - assert isinstance(get_coriolis_profile_id(params[0], params[1], api_server=mocked_server_address), pd.core.frame.DataFrame) - -@pytest.mark.parametrize("params", [[6901929, None], [6901929, 12]], indirect=False, ids=['float', 'profile']) -def test_get_ea_profile_page(params, mocked_httpserver): - with argopy.set_options(cachedir=tempfile.mkdtemp()): - assert is_list_of_strings(get_ea_profile_page(params[0], params[1], api_server=mocked_server_address)) diff --git a/argopy/tests/test_utils_accessories.py b/argopy/tests/test_utils_accessories.py new file mode 100644 index 00000000..f786d8c1 --- /dev/null +++ b/argopy/tests/test_utils_accessories.py @@ -0,0 +1,86 @@ +import pytest +from argopy.utils.accessories import float_wmo, Registry + + +class Test_float_wmo(): + + def test_init(self): + assert isinstance(float_wmo(2901746), float_wmo) + assert isinstance(float_wmo(float_wmo(2901746)), float_wmo) + + def test_isvalid(self): + assert float_wmo(2901746).isvalid + assert not float_wmo(12, errors='ignore').isvalid + + def test_ppt(self): + assert isinstance(str(float_wmo(2901746)), str) + assert isinstance(repr(float_wmo(2901746)), str) + + def test_comparisons(self): + assert float_wmo(2901746) == float_wmo(2901746) + assert float_wmo(2901746) != float_wmo(2901745) + assert float_wmo(2901746) >= float_wmo(2901746) + assert float_wmo(2901746) > float_wmo(2901745) + assert float_wmo(2901746) <= float_wmo(2901746) + assert float_wmo(2901746) < float_wmo(2901747) + + def test_hashable(self): + assert isinstance(hash(float_wmo(2901746)), int) + + +class Test_Registry(): + + opts = [(None, 'str'), (['hello', 'world'], str), (None, float_wmo), ([2901746, 4902252], float_wmo)] + opts_ids = ["%s, %s" % ((lambda x: 'iterlist' if x is not None else x)(opt[0]), repr(opt[1])) for opt in opts] + + 
@pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids)
+    def test_init(self, opts):
+        assert isinstance(Registry(opts[0], dtype=opts[1]), Registry)
+
+    opts = [(['hello', 'world'], str), ([2901746, 4902252], float_wmo)]
+    opts_ids = ["%s, %s" % ((lambda x: 'iterlist' if x is not None else x)(opt[0]), repr(opt[1])) for opt in opts]
+
+    @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids)
+    def test_commit(self, opts):
+        R = Registry(dtype=opts[1])
+        R.commit(opts[0])
+
+    @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids)
+    def test_append(self, opts):
+        R = Registry(dtype=opts[1])
+        R.append(opts[0][0])
+
+    @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids)
+    def test_extend(self, opts):
+        R = Registry(dtype=opts[1])
+        R.extend(opts[0])
+
+    @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids)
+    def test_insert(self, opts):
+        R = Registry(opts[0][0], dtype=opts[1])
+        R.insert(0, opts[0][-1])
+        assert R[0] == opts[0][-1]
+
+    @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids)
+    def test_remove(self, opts):
+        R = Registry(opts[0], dtype=opts[1])
+        R.remove(opts[0][0])
+        assert opts[0][0] not in R
+
+    @pytest.mark.parametrize("opts", opts, indirect=False, ids=opts_ids)
+    def test_copy(self, opts):
+        R = Registry(opts[0], dtype=opts[1])
+        assert R == R.copy()
+
+    bad_opts = [(['hello', 12], str), ([2901746, 1], float_wmo)]
+    bad_opts_ids = ["%s, %s" % ((lambda x: 'iterlist' if x is not None else x)(opt[0]), repr(opt[1])) for opt in bad_opts]
+
+    @pytest.mark.parametrize("opts", bad_opts, indirect=False, ids=bad_opts_ids)
+    def test_invalid_dtype(self, opts):
+        with pytest.raises(ValueError):
+            Registry(opts[0][0], dtype=opts[1], invalid='raise').commit(opts[0][-1])
+        with pytest.warns(UserWarning):
+            Registry(opts[0][0], dtype=opts[1], invalid='warn').commit(opts[0][-1])
+        # Raise nothing:
+        Registry(opts[0][0], dtype=opts[1], invalid='ignore').commit(opts[0][-1])
+
diff --git a/argopy/tests/test_utils_caching.py b/argopy/tests/test_utils_caching.py
new file mode 100644
index 00000000..59472072
--- /dev/null
+++ b/argopy/tests/test_utils_caching.py
@@ -0,0 +1,35 @@
+import os
+import pandas as pd
+import argopy
+from argopy import DataFetcher as ArgoDataFetcher
+from utils import (
+    requires_gdac,
+)
+import tempfile
+
+
+@requires_gdac
+def test_clear_cache():
+    ftproot, flist = argopy.tutorial.open_dataset("gdac")
+    with tempfile.TemporaryDirectory() as cachedir:
+        with argopy.set_options(cachedir=cachedir):
+            loader = ArgoDataFetcher(src="gdac", ftp=ftproot, cache=True).profile(2902696, 12)
+            loader.to_xarray()
+            argopy.clear_cache()
+            assert os.path.exists(cachedir) is True
+            assert len(os.listdir(cachedir)) == 0
+
+
+@requires_gdac
+def test_lscache():
+    ftproot, flist = argopy.tutorial.open_dataset("gdac")
+    with tempfile.TemporaryDirectory() as cachedir:
+        with argopy.set_options(cachedir=cachedir):
+            loader = ArgoDataFetcher(src="gdac", ftp=ftproot, cache=True).profile(2902696, 12)
+            loader.to_xarray()
+            result = argopy.utilities.lscache(cache_path=cachedir, prt=True)
+            assert isinstance(result, str)
+
+            result = argopy.utilities.lscache(cache_path=cachedir, prt=False)
+            assert isinstance(result, pd.DataFrame)
+
diff --git a/argopy/tests/test_utils_checkers.py b/argopy/tests/test_utils_checkers.py
index 987bd88a..b8c2d53d 100644
--- a/argopy/tests/test_utils_checkers.py
+++ b/argopy/tests/test_utils_checkers.py
@@ -1,7 +1,9 @@
 import pytest
 import numpy as np
 from mocked_http import
mocked_httpserver, mocked_server_address - +from utils import ( + requires_erddap, +) import argopy from argopy.errors import FtpPathError from argopy.utils.checkers import ( @@ -222,5 +224,3 @@ def test_erddap_ds_exists(mocked_httpserver): with argopy.set_options(erddap=mocked_server_address): assert isinstance(erddap_ds_exists(ds="ArgoFloats"), bool) assert erddap_ds_exists(ds="DummyDS") is False - -# todo : Implement tests for utilities functions: badge, fetch_status and monitor_status diff --git a/argopy/tests/test_utils_chunking.py b/argopy/tests/test_utils_chunking.py new file mode 100644 index 00000000..3aee8c86 --- /dev/null +++ b/argopy/tests/test_utils_chunking.py @@ -0,0 +1,196 @@ +import pytest +import types +import numpy as np +import pandas as pd + +from argopy.errors import InvalidFetcherAccessPoint +from argopy.utils.chunking import Chunker +from argopy.utils.checkers import is_box + + +class Test_Chunker: + @pytest.fixture(autouse=True) + def create_data(self): + self.WMO = [ + 6902766, + 6902772, + 6902914, + 6902746, + 6902916, + 6902915, + 6902757, + 6902771, + ] + self.BOX3d = [0, 20, 40, 60, 0, 1000] + self.BOX4d = [0, 20, 40, 60, 0, 1000, "2001-01", "2001-6"] + + def test_InvalidFetcherAccessPoint(self): + with pytest.raises(InvalidFetcherAccessPoint): + Chunker({"invalid": self.WMO}) + + def test_invalid_chunks(self): + with pytest.raises(ValueError): + Chunker({"box": self.BOX3d}, chunks='toto') + + def test_invalid_chunksize(self): + with pytest.raises(ValueError): + Chunker({"box": self.BOX3d}, chunksize='toto') + + def test_chunk_wmo(self): + C = Chunker({"wmo": self.WMO}) + assert all( + [all(isinstance(x, int) for x in chunk) for chunk in C.fit_transform()] + ) + + C = Chunker({"wmo": self.WMO}, chunks="auto") + assert all( + [all(isinstance(x, int) for x in chunk) for chunk in C.fit_transform()] + ) + + C = Chunker({"wmo": self.WMO}, chunks={"wmo": 1}) + assert all( + [all(isinstance(x, int) for x in chunk) for chunk in C.fit_transform()] + ) + assert len(C.fit_transform()) == 1 + + with pytest.raises(ValueError): + Chunker({"wmo": self.WMO}, chunks=["wmo", 1]) + + C = Chunker({"wmo": self.WMO}) + assert isinstance(C.this_chunker, types.FunctionType) or isinstance( + C.this_chunker, types.MethodType + ) + + def test_chunk_box3d(self): + C = Chunker({"box": self.BOX3d}) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + + C = Chunker({"box": self.BOX3d}, chunks="auto") + assert all([is_box(chunk) for chunk in C.fit_transform()]) + + C = Chunker({"box": self.BOX3d}, chunks={"lon": 12, "lat": 1, "dpt": 1}) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + assert len(C.fit_transform()) == 12 + + C = Chunker( + {"box": self.BOX3d}, chunks={"lat": 1, "dpt": 1}, chunksize={"lon": 10} + ) + chunks = C.fit_transform() + assert all([is_box(chunk) for chunk in chunks]) + assert chunks[0][1] - chunks[0][0] == 10 + + C = Chunker({"box": self.BOX3d}, chunks={"lon": 1, "lat": 12, "dpt": 1}) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + assert len(C.fit_transform()) == 12 + + C = Chunker( + {"box": self.BOX3d}, chunks={"lon": 1, "dpt": 1}, chunksize={"lat": 10} + ) + chunks = C.fit_transform() + assert all([is_box(chunk) for chunk in chunks]) + assert chunks[0][3] - chunks[0][2] == 10 + + C = Chunker({"box": self.BOX3d}, chunks={"lon": 1, "lat": 1, "dpt": 12}) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + assert len(C.fit_transform()) == 12 + + C = Chunker( + {"box": self.BOX3d}, chunks={"lon": 1, "lat": 1}, 
chunksize={"dpt": 10} + ) + chunks = C.fit_transform() + assert all([is_box(chunk) for chunk in chunks]) + assert chunks[0][5] - chunks[0][4] == 10 + + C = Chunker({"box": self.BOX3d}, chunks={"lon": 4, "lat": 2, "dpt": 1}) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + assert len(C.fit_transform()) == 2 * 4 + + C = Chunker({"box": self.BOX3d}, chunks={"lon": 2, "lat": 3, "dpt": 4}) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + assert len(C.fit_transform()) == 2 * 3 * 4 + + with pytest.raises(ValueError): + Chunker({"box": self.BOX3d}, chunks=["lon", 1]) + + C = Chunker({"box": self.BOX3d}) + assert isinstance(C.this_chunker, types.FunctionType) or isinstance( + C.this_chunker, types.MethodType + ) + + def test_chunk_box4d(self): + C = Chunker({"box": self.BOX4d}) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + + C = Chunker({"box": self.BOX4d}, chunks="auto") + assert all([is_box(chunk) for chunk in C.fit_transform()]) + + C = Chunker( + {"box": self.BOX4d}, chunks={"lon": 2, "lat": 1, "dpt": 1, "time": 1} + ) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + assert len(C.fit_transform()) == 2 + + C = Chunker( + {"box": self.BOX4d}, + chunks={"lat": 1, "dpt": 1, "time": 1}, + chunksize={"lon": 10}, + ) + chunks = C.fit_transform() + assert all([is_box(chunk) for chunk in chunks]) + assert chunks[0][1] - chunks[0][0] == 10 + + C = Chunker( + {"box": self.BOX4d}, chunks={"lon": 1, "lat": 2, "dpt": 1, "time": 1} + ) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + assert len(C.fit_transform()) == 2 + + C = Chunker( + {"box": self.BOX4d}, + chunks={"lon": 1, "dpt": 1, "time": 1}, + chunksize={"lat": 10}, + ) + chunks = C.fit_transform() + assert all([is_box(chunk) for chunk in chunks]) + assert chunks[0][3] - chunks[0][2] == 10 + + C = Chunker( + {"box": self.BOX4d}, chunks={"lon": 1, "lat": 1, "dpt": 2, "time": 1} + ) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + assert len(C.fit_transform()) == 2 + + C = Chunker( + {"box": self.BOX4d}, + chunks={"lon": 1, "lat": 1, "time": 1}, + chunksize={"dpt": 10}, + ) + chunks = C.fit_transform() + assert all([is_box(chunk) for chunk in chunks]) + assert chunks[0][5] - chunks[0][4] == 10 + + C = Chunker( + {"box": self.BOX4d}, chunks={"lon": 1, "lat": 1, "dpt": 1, "time": 2} + ) + assert all([is_box(chunk) for chunk in C.fit_transform()]) + assert len(C.fit_transform()) == 2 + + C = Chunker( + {"box": self.BOX4d}, + chunks={"lon": 1, "lat": 1, "dpt": 1}, + chunksize={"time": 5}, + ) + chunks = C.fit_transform() + assert all([is_box(chunk) for chunk in chunks]) + assert np.timedelta64( + pd.to_datetime(chunks[0][7]) - pd.to_datetime(chunks[0][6]), "D" + ) <= np.timedelta64(5, "D") + + with pytest.raises(ValueError): + Chunker({"box": self.BOX4d}, chunks=["lon", 1]) + + C = Chunker({"box": self.BOX4d}) + assert isinstance(C.this_chunker, types.FunctionType) or isinstance( + C.this_chunker, types.MethodType + ) + diff --git a/argopy/utilities.py b/argopy/utilities.py index fd5e0479..2a8cf81a 100644 --- a/argopy/utilities.py +++ b/argopy/utilities.py @@ -12,12 +12,10 @@ import urllib import json import collections -from collections import UserList import copy from functools import reduce, wraps from packaging import version import logging -from abc import ABC, abstractmethod from urllib.parse import urlparse from typing import Union import inspect @@ -82,117 +80,6 @@ log = logging.getLogger("argopy.utilities") -def clear_cache(fs=None): - """ Delete argopy cache 
folder content """ - if os.path.exists(OPTIONS["cachedir"]): - # shutil.rmtree(OPTIONS["cachedir"]) - for filename in os.listdir(OPTIONS["cachedir"]): - file_path = os.path.join(OPTIONS["cachedir"], filename) - try: - if os.path.isfile(file_path) or os.path.islink(file_path): - os.unlink(file_path) - elif os.path.isdir(file_path): - shutil.rmtree(file_path) - except Exception as e: - print("Failed to delete %s. Reason: %s" % (file_path, e)) - if fs: - fs.clear_cache() - - -def lscache(cache_path: str = "", prt=True): - """ Decode and list cache folder content - - Parameters - ---------- - cache_path: str - prt: bool, default=True - Return a printable string or a :class:`pandas.DataFrame` - - Returns - ------- - str or :class:`pandas.DataFrame` - """ - from datetime import datetime - import math - summary = [] - - cache_path = OPTIONS['cachedir'] if cache_path == '' else cache_path - apath = os.path.abspath(cache_path) - log.debug("Listing cache content at: %s" % cache_path) - - def convert_size(size_bytes): - if size_bytes == 0: - return "0B" - size_name = ("B", "KB", "MB", "GB", "TB", "PB", "EB", "ZB", "YB") - i = int(math.floor(math.log(size_bytes, 1024))) - p = math.pow(1024, i) - s = round(size_bytes / p, 2) - return "%s %s" % (s, size_name[i]) - - cached_files = [] - fn = os.path.join(apath, "cache") - if os.path.exists(fn): - with open(fn, "rb") as f: - loaded_cached_files = pickle.load(f) # nosec B301 because files controlled internally - for c in loaded_cached_files.values(): - if isinstance(c["blocks"], list): - c["blocks"] = set(c["blocks"]) - cached_files.append(loaded_cached_files) - else: - raise FileSystemHasNoCache("No fsspec cache system at: %s" % apath) - - cached_files = cached_files or [{}] - cached_files = cached_files[-1] - - N_FILES = len(cached_files) - TOTAL_SIZE = 0 - for cfile in cached_files: - path = os.path.join(apath, cached_files[cfile]['fn']) - TOTAL_SIZE += os.path.getsize(path) - - summary.append("%s %s" % ("=" * 20, "%i files in fsspec cache folder (%s)" % (N_FILES, convert_size(TOTAL_SIZE)))) - summary.append("lscache %s" % os.path.sep.join([apath, ""])) - summary.append("=" * 20) - - listing = {'fn': [], 'size': [], 'time': [], 'original': [], 'uid': [], 'blocks': []} - for cfile in cached_files: - summary.append("- %s" % cached_files[cfile]['fn']) - listing['fn'].append(cached_files[cfile]['fn']) - - path = os.path.join(cache_path, cached_files[cfile]['fn']) - summary.append("\t%8s: %s" % ('SIZE', convert_size(os.path.getsize(path)))) - listing['size'].append(os.path.getsize(path)) - - key = 'time' - ts = cached_files[cfile][key] - tsf = pd.to_datetime(datetime.fromtimestamp(ts)).strftime("%c") - summary.append("\t%8s: %s (%s)" % (key, tsf, ts)) - listing['time'].append(pd.to_datetime(datetime.fromtimestamp(ts))) - - if version.parse(fsspec.__version__) > version.parse("0.8.7"): - key = 'original' - summary.append("\t%8s: %s" % (key, cached_files[cfile][key])) - listing[key].append(cached_files[cfile][key]) - - key = 'uid' - summary.append("\t%8s: %s" % (key, cached_files[cfile][key])) - listing[key].append(cached_files[cfile][key]) - - key = 'blocks' - summary.append("\t%8s: %s" % (key, cached_files[cfile][key])) - listing[key].append(cached_files[cfile][key]) - - summary.append("=" * 20) - summary = "\n".join(summary) - if prt: - # Return string to be printed: - return summary - else: - # Return dataframe listing: - # log.debug(summary) - return pd.DataFrame(listing) - - def get_sys_info(): """Returns system information as a dict""" @@ -621,276 
+508,6 @@ def _regular_interp(x, y, target_values): return remapped -class Chunker: - """ To chunk fetcher requests """ - - # Default maximum chunks size for all possible request parameters - default_chunksize = { - "box": { - "lon": 20, # degree - "lat": 20, # degree - "dpt": 500, # meters/db - "time": 3 * 30, - }, # Days - "wmo": {"wmo": 5, "cyc": 100}, # Nb of floats - } # Nb of cycles - - def __init__(self, request: dict, chunks: str = "auto", chunksize: dict = {}): - """ Create a request Chunker - - Allow to easily split an access point request into chunks - - Parameters - ---------- - request: dict - Access point request to be chunked. One of the following: - - - {'box': [lon_min, lon_max, lat_min, lat_max, dpt_min, dpt_max, time_min, time_max]} - - {'box': [lon_min, lon_max, lat_min, lat_max, dpt_min, dpt_max]} - - {'wmo': [wmo1, wmo2, ...], 'cyc': [0,1, ...]} - chunks: 'auto' or dict - Dictionary with request access point as keys and number of chunks to create as values. - - Eg: {'wmo':10} will create a maximum of 10 chunks along WMOs. - chunksize: dict, optional - Dictionary with request access point as keys and chunk size as values (used as maximum values in - 'auto' chunking). - - Eg: {'wmo': 5} will create chunks with as many as 5 WMOs each. - - """ - self.request = request - - if "box" in self.request: - is_box(self.request["box"]) - if len(self.request["box"]) == 8: - self.this_chunker = self._chunker_box4d - elif len(self.request["box"]) == 6: - self.this_chunker = self._chunker_box3d - elif "wmo" in self.request: - self.this_chunker = self._chunker_wmo - else: - raise InvalidFetcherAccessPoint( - "'%s' not valid access point" % ",".join(self.request.keys()) - ) - - default = self.default_chunksize[[k for k in self.request.keys()][0]] - if len(chunksize) == 0: # chunksize = {} - chunksize = default - if not isinstance(chunksize, collectionsAbc.Mapping): - raise ValueError("chunksize must be mappable") - else: # merge with default: - chunksize = {**default, **chunksize} - self.chunksize = collections.OrderedDict(sorted(chunksize.items())) - - default = {k: "auto" for k in self.chunksize.keys()} - if chunks == "auto": # auto for all - chunks = default - elif len(chunks) == 0: # chunks = {}, i.e. chunk=1 for all - chunks = {k: 1 for k in self.request} - if not isinstance(chunks, collectionsAbc.Mapping): - raise ValueError("chunks must be 'auto' or mappable") - chunks = {**default, **chunks} - self.chunks = collections.OrderedDict(sorted(chunks.items())) - - def _split(self, lst, n=1): - """Yield successive n-sized chunks from lst""" - for i in range(0, len(lst), n): - yield lst[i: i + n] - - def _split_list_bychunknb(self, lst, n=1): - """Split list in n-imposed chunks of similar size - The last chunk may contain less element than the others, depending on the size of the list. - """ - res = [] - s = int(np.floor_divide(len(lst), n)) - for i in self._split(lst, s): - res.append(i) - if len(res) > n: - res[n - 1::] = [reduce(lambda i, j: i + j, res[n - 1::])] - return res - - def _split_list_bychunksize(self, lst, max_size=1): - """Split list in chunks of imposed size - The last chunk may contain less element than the others, depending on the size of the list. 
- """ - res = [] - for i in self._split(lst, max_size): - res.append(i) - return res - - def _split_box(self, large_box, n=1, d="x"): # noqa: C901 - """Split a box domain in one direction in n-imposed equal chunks """ - if d == "x": - i_left, i_right = 0, 1 - if d == "y": - i_left, i_right = 2, 3 - if d == "z": - i_left, i_right = 4, 5 - if d == "t": - i_left, i_right = 6, 7 - if n == 1: - return [large_box] - boxes = [] - if d in ["x", "y", "z"]: - n += 1 # Required because we split in linspace - bins = np.linspace(large_box[i_left], large_box[i_right], n) - for ii, left in enumerate(bins): - if ii < len(bins) - 1: - right = bins[ii + 1] - this_box = large_box.copy() - this_box[i_left] = left - this_box[i_right] = right - boxes.append(this_box) - elif "t" in d: - dates = pd.to_datetime(large_box[i_left: i_right + 1]) - date_bounds = [ - d.strftime("%Y%m%d%H%M%S") - for d in pd.date_range(dates[0], dates[1], periods=n + 1) - ] - for i1, i2 in zip(np.arange(0, n), np.arange(1, n + 1)): - left, right = date_bounds[i1], date_bounds[i2] - this_box = large_box.copy() - this_box[i_left] = left - this_box[i_right] = right - boxes.append(this_box) - return boxes - - def _split_this_4Dbox(self, box, nx=1, ny=1, nz=1, nt=1): - box_list = [] - split_x = self._split_box(box, n=nx, d="x") - for bx in split_x: - split_y = self._split_box(bx, n=ny, d="y") - for bxy in split_y: - split_z = self._split_box(bxy, n=nz, d="z") - for bxyz in split_z: - split_t = self._split_box(bxyz, n=nt, d="t") - for bxyzt in split_t: - box_list.append(bxyzt) - return box_list - - def _split_this_3Dbox(self, box, nx=1, ny=1, nz=1): - box_list = [] - split_x = self._split_box(box, n=nx, d="x") - for bx in split_x: - split_y = self._split_box(bx, n=ny, d="y") - for bxy in split_y: - split_z = self._split_box(bxy, n=nz, d="z") - for bxyz in split_z: - box_list.append(bxyz) - return box_list - - def _chunker_box4d(self, request, chunks, chunks_maxsize): # noqa: C901 - BOX = request["box"] - n_chunks = chunks - for axis, n in n_chunks.items(): - if n == "auto": - if axis == "lon": - Lx = BOX[1] - BOX[0] - if Lx > chunks_maxsize["lon"]: # Max box size in longitude - n_chunks["lon"] = int( - np.ceil(np.divide(Lx, chunks_maxsize["lon"])) - ) - else: - n_chunks["lon"] = 1 - if axis == "lat": - Ly = BOX[3] - BOX[2] - if Ly > chunks_maxsize["lat"]: # Max box size in latitude - n_chunks["lat"] = int( - np.ceil(np.divide(Ly, chunks_maxsize["lat"])) - ) - else: - n_chunks["lat"] = 1 - if axis == "dpt": - Lz = BOX[5] - BOX[4] - if Lz > chunks_maxsize["dpt"]: # Max box size in depth - n_chunks["dpt"] = int( - np.ceil(np.divide(Lz, chunks_maxsize["dpt"])) - ) - else: - n_chunks["dpt"] = 1 - if axis == "time": - Lt = np.timedelta64( - pd.to_datetime(BOX[7]) - pd.to_datetime(BOX[6]), "D" - ) - MaxLen = np.timedelta64(chunks_maxsize["time"], "D") - if Lt > MaxLen: # Max box size in time - n_chunks["time"] = int(np.ceil(np.divide(Lt, MaxLen))) - else: - n_chunks["time"] = 1 - - boxes = self._split_this_4Dbox( - BOX, - nx=n_chunks["lon"], - ny=n_chunks["lat"], - nz=n_chunks["dpt"], - nt=n_chunks["time"], - ) - return {"chunks": sorted(n_chunks), "values": boxes} - - def _chunker_box3d(self, request, chunks, chunks_maxsize): - BOX = request["box"] - n_chunks = chunks - for axis, n in n_chunks.items(): - if n == "auto": - if axis == "lon": - Lx = BOX[1] - BOX[0] - if Lx > chunks_maxsize["lon"]: # Max box size in longitude - n_chunks["lon"] = int( - np.floor_divide(Lx, chunks_maxsize["lon"]) - ) - else: - n_chunks["lon"] = 1 - if axis == "lat": - Ly 
= BOX[3] - BOX[2] - if Ly > chunks_maxsize["lat"]: # Max box size in latitude - n_chunks["lat"] = int( - np.floor_divide(Ly, chunks_maxsize["lat"]) - ) - else: - n_chunks["lat"] = 1 - if axis == "dpt": - Lz = BOX[5] - BOX[4] - if Lz > chunks_maxsize["dpt"]: # Max box size in depth - n_chunks["dpt"] = int( - np.floor_divide(Lz, chunks_maxsize["dpt"]) - ) - else: - n_chunks["dpt"] = 1 - # if axis == 'time': - # Lt = np.timedelta64(pd.to_datetime(BOX[5]) - pd.to_datetime(BOX[4]), 'D') - # MaxLen = np.timedelta64(chunks_maxsize['time'], 'D') - # if Lt > MaxLen: # Max box size in time - # n_chunks['time'] = int(np.floor_divide(Lt, MaxLen)) - # else: - # n_chunks['time'] = 1 - boxes = self._split_this_3Dbox( - BOX, nx=n_chunks["lon"], ny=n_chunks["lat"], nz=n_chunks["dpt"] - ) - return {"chunks": sorted(n_chunks), "values": boxes} - - def _chunker_wmo(self, request, chunks, chunks_maxsize): - WMO = request["wmo"] - n_chunks = chunks - if n_chunks["wmo"] == "auto": - wmo_grps = self._split_list_bychunksize(WMO, max_size=chunks_maxsize["wmo"]) - else: - n = np.min([n_chunks["wmo"], len(WMO)]) - wmo_grps = self._split_list_bychunknb(WMO, n=n) - n_chunks["wmo"] = len(wmo_grps) - return {"chunks": sorted(n_chunks), "values": wmo_grps} - - def fit_transform(self): - """ Chunk a fetcher request - - Returns - ------- - list - """ - self._results = self.this_chunker(self.request, self.chunks, self.chunksize) - # self.chunks = self._results['chunks'] - return self._results["values"] - def format_oneline(s, max_width=65): """ Return a string formatted for a line print """ @@ -1367,258 +984,6 @@ def fix_localhost(host): return dict(sorted(output.items())) -class RegistryItem(ABC): - """Prototype for possible custom items in a Registry""" - @property - @abstractmethod - def value(self): - raise NotImplementedError("Not implemented") - - @property - @abstractmethod - def isvalid(self, item): - raise NotImplementedError("Not implemented") - - @abstractmethod - def __str__(self): - raise NotImplementedError("Not implemented") - - @abstractmethod - def __repr__(self): - raise NotImplementedError("Not implemented") - - -class float_wmo(RegistryItem): - """Argo float WMO number object""" - - def __init__(self, WMO_number, errors='raise'): - """Create an Argo float WMO number object - - Parameters - ---------- - WMO_number: object - Anything that could be casted as an integer - errors: {'raise', 'warn', 'ignore'} - Possibly raises a ValueError exception or UserWarning, otherwise fails silently if WMO_number is not valid - - Returns - ------- - :class:`argopy.utilities.float_wmo` - """ - self.errors = errors - if isinstance(WMO_number, float_wmo): - item = WMO_number.value - else: - item = check_wmo(WMO_number, errors=self.errors)[0] # This will automatically validate item - self.item = item - - @property - def isvalid(self): - """Check if WMO number is valid""" - return is_wmo(self.item, errors=self.errors) - # return True # Because it was checked at instantiation - - @property - def value(self): - """Return WMO number as in integer""" - return int(self.item) - - def __str__(self): - # return "%s" % check_wmo(self.item)[0] - return "%s" % self.item - - def __repr__(self): - return f"WMO({self.item})" - - def __check_other__(self, other): - return check_wmo(other)[0] if type(other) is not float_wmo else other.item - - def __eq__(self, other): - return self.item.__eq__(self.__check_other__(other)) - - def __ne__(self, other): - return self.item.__ne__(self.__check_other__(other)) - - def __gt__(self, other): - return 
self.item.__gt__(self.__check_other__(other)) - - def __lt__(self, other): - return self.item.__lt__(self.__check_other__(other)) - - def __ge__(self, other): - return self.item.__ge__(self.__check_other__(other)) - - def __le__(self, other): - return self.item.__le__(self.__check_other__(other)) - - def __hash__(self): - return hash(self.item) - - -class Registry(UserList): - """A list manager can that validate item type - - Examples - -------- - You can commit new entry to the registry, one by one: - - >>> R = Registry(name='file') - >>> R.commit('meds/4901105/profiles/D4901105_017.nc') - >>> R.commit('aoml/1900046/profiles/D1900046_179.nc') - - Or with a list: - - >>> R = Registry(name='My floats', dtype='wmo') - >>> R.commit([2901746, 4902252]) - - And also at instantiation time (name and dtype are optional): - - >>> R = Registry([2901746, 4902252], name='My floats', dtype=float_wmo) - - Registry can be used like a list. - - It is iterable: - - >>> for wmo in R: - >>> print(wmo) - - It has a ``len`` property: - - >>> len(R) - - It can be checked for values: - - >>> 4902252 in R - - You can also remove items from the registry, again one by one or with a list: - - >>> R.remove('2901746') - - """ - - def _complain(self, msg): - if self._invalid == 'raise': - raise ValueError(msg) - elif self._invalid == 'warn': - warnings.warn(msg) - else: - log.debug(msg) - - def _str(self, item): - is_valid = isinstance(item, str) - if not is_valid: - self._complain("%s is not a valid %s" % (str(item), self.dtype)) - return is_valid - - def _dict(self, item): - is_valid = isinstance(item, dict) - if not is_valid: - self._complain("%s is not a valid %s" % (str(item), self.dtype)) - return is_valid - - def _wmo(self, item): - return item.isvalid - - def __init__(self, initlist=None, name: str = 'unnamed', dtype='str', invalid='raise'): - """Create a registry, i.e. a controlled list - - Parameters - ---------- - initlist: list, optional - List of values to register - name: str, default: 'unnamed' - Name of the Registry - dtype: :class:`str` or dtype, default: :class:`str` - Data type of registry content. Supported values are: 'str', 'wmo', float_wmo - invalid: str, default: 'raise' - Define what do to when a new item is not valid. 
Can be 'raise' or 'ignore' - """ - self.name = name - self._invalid = invalid - if repr(dtype) == "" or dtype == 'str': - self._validator = self._str - self.dtype = str - elif dtype == float_wmo or str(dtype).lower() == 'wmo': - self._validator = self._wmo - self.dtype = float_wmo - elif repr(dtype) == "" or dtype == 'dict': - self._validator = self._dict - self.dtype = dict - elif hasattr(dtype, 'isvalid'): - self._validator = dtype.isvalid - self.dtype = dtype - else: - raise ValueError("Unrecognised Registry data type '%s'" % dtype) - - if initlist is not None: - initlist = self._process_items(initlist) - super().__init__(initlist) - - def __repr__(self): - summary = ["%s" % str(self.dtype)] - summary.append("Name: %s" % self.name) - N = len(self.data) - msg = "Nitems: %s" % N if N > 1 else "Nitem: %s" % N - summary.append(msg) - if N > 0: - items = [str(item) for item in self.data] - # msg = format_oneline("[%s]" % "; ".join(items), max_width=120) - msg = "[%s]" % "; ".join(items) - summary.append("Content: %s" % msg) - return "\n".join(summary) - - def _process_items(self, items): - if not isinstance(items, list): - items = [items] - if self.dtype == float_wmo: - items = [float_wmo(item, errors=self._invalid) for item in items] - return items - - def commit(self, values): - """R.commit(values) -- append values to the end of the registry if not already in""" - items = self._process_items(values) - for item in items: - if item not in self.data and self._validator(item): - super().append(item) - return self - - def append(self, value): - """R.append(value) -- append value to the end of the registry""" - items = self._process_items(value) - for item in items: - if self._validator(item): - super().append(item) - return self - - def extend(self, other): - """R.extend(iterable) -- extend registry by appending elements from the iterable""" - self.append(other) - return self - - def remove(self, values): - """R.remove(valueS) -- remove first occurrence of values.""" - items = self._process_items(values) - for item in items: - if item in self.data: - super().remove(item) - return self - - def insert(self, index, value): - """R.insert(index, value) -- insert value before index.""" - item = self._process_items(value)[0] - if self._validator(item): - super().insert(index, item) - return self - - def __copy__(self): - # Called with copy.copy(R) - return Registry(copy.copy(self.data), dtype=self.dtype) - - def copy(self): - """Return a shallow copy of the registry""" - return self.__copy__() - - def log_argopy_callerstack(level='debug'): """log the caller’s stack""" froot = str(pathlib.Path(__file__).parent.resolve()) diff --git a/argopy/utils/__init__.py b/argopy/utils/__init__.py index 8acfbd69..69f2bb23 100644 --- a/argopy/utils/__init__.py +++ b/argopy/utils/__init__.py @@ -1,4 +1,3 @@ -from .monitored_threadpool import MyThreadPoolExecutor as MonitoredThreadPoolExecutor from .checkers import ( is_box, is_indexbox, is_list_of_strings, is_list_of_dicts, is_list_of_datasets, is_list_equal, @@ -17,13 +16,13 @@ list_standard_variables, list_multiprofile_file_variables ) - +from .caching import clear_cache, lscache +from .monitored_threadpool import MyThreadPoolExecutor as MonitoredThreadPoolExecutor +from .chunking import Chunker +from .accessories import Registry, float_wmo __all__ = ( - # Classes: - "MonitoredThreadPoolExecutor", - # Checkers: "is_box", "is_indexbox", "is_list_of_strings", "is_list_of_dicts", "is_list_of_datasets", "is_list_equal", @@ -47,4 +46,14 @@ "list_available_index_src", 
"list_standard_variables", "list_multiprofile_file_variables", + + # Cache management: + "clear_cache", "lscache", + + # Computation and performances: + "MonitoredThreadPoolExecutor", + "Chunker", + + # Accessories classes (specific objects): + "Registry", "float_wmo" ) diff --git a/argopy/utils/accessories.py b/argopy/utils/accessories.py new file mode 100644 index 00000000..5be8c7b0 --- /dev/null +++ b/argopy/utils/accessories.py @@ -0,0 +1,262 @@ +from abc import ABC, abstractmethod +from collections import UserList +import warnings +import logging +import copy + +from .checkers import check_wmo, is_wmo + + +log = logging.getLogger("argopy.utils.accessories") + + +class RegistryItem(ABC): + """Prototype for possible custom items in a Registry""" + @property + @abstractmethod + def value(self): + raise NotImplementedError("Not implemented") + + @property + @abstractmethod + def isvalid(self, item): + raise NotImplementedError("Not implemented") + + @abstractmethod + def __str__(self): + raise NotImplementedError("Not implemented") + + @abstractmethod + def __repr__(self): + raise NotImplementedError("Not implemented") + + +class float_wmo(RegistryItem): + """Argo float WMO number object""" + + def __init__(self, WMO_number, errors='raise'): + """Create an Argo float WMO number object + + Parameters + ---------- + WMO_number: object + Anything that could be casted as an integer + errors: {'raise', 'warn', 'ignore'} + Possibly raises a ValueError exception or UserWarning, otherwise fails silently if WMO_number is not valid + + Returns + ------- + :class:`argopy.utilities.float_wmo` + """ + self.errors = errors + if isinstance(WMO_number, float_wmo): + item = WMO_number.value + else: + item = check_wmo(WMO_number, errors=self.errors)[0] # This will automatically validate item + self.item = item + + @property + def isvalid(self): + """Check if WMO number is valid""" + return is_wmo(self.item, errors=self.errors) + # return True # Because it was checked at instantiation + + @property + def value(self): + """Return WMO number as in integer""" + return int(self.item) + + def __str__(self): + # return "%s" % check_wmo(self.item)[0] + return "%s" % self.item + + def __repr__(self): + return f"WMO({self.item})" + + def __check_other__(self, other): + return check_wmo(other)[0] if type(other) is not float_wmo else other.item + + def __eq__(self, other): + return self.item.__eq__(self.__check_other__(other)) + + def __ne__(self, other): + return self.item.__ne__(self.__check_other__(other)) + + def __gt__(self, other): + return self.item.__gt__(self.__check_other__(other)) + + def __lt__(self, other): + return self.item.__lt__(self.__check_other__(other)) + + def __ge__(self, other): + return self.item.__ge__(self.__check_other__(other)) + + def __le__(self, other): + return self.item.__le__(self.__check_other__(other)) + + def __hash__(self): + return hash(self.item) + + +class Registry(UserList): + """A list manager can that validate item type + + Examples + -------- + You can commit new entry to the registry, one by one: + + >>> R = Registry(name='file') + >>> R.commit('meds/4901105/profiles/D4901105_017.nc') + >>> R.commit('aoml/1900046/profiles/D1900046_179.nc') + + Or with a list: + + >>> R = Registry(name='My floats', dtype='wmo') + >>> R.commit([2901746, 4902252]) + + And also at instantiation time (name and dtype are optional): + + >>> R = Registry([2901746, 4902252], name='My floats', dtype=float_wmo) + + Registry can be used like a list. 
+ + It is iterable: + + >>> for wmo in R: + >>> print(wmo) + + It has a ``len`` property: + + >>> len(R) + + It can be checked for values: + + >>> 4902252 in R + + You can also remove items from the registry, again one by one or with a list: + + >>> R.remove('2901746') + + """ + + def _complain(self, msg): + if self._invalid == 'raise': + raise ValueError(msg) + elif self._invalid == 'warn': + warnings.warn(msg) + else: + log.debug(msg) + + def _str(self, item): + is_valid = isinstance(item, str) + if not is_valid: + self._complain("%s is not a valid %s" % (str(item), self.dtype)) + return is_valid + + def _dict(self, item): + is_valid = isinstance(item, dict) + if not is_valid: + self._complain("%s is not a valid %s" % (str(item), self.dtype)) + return is_valid + + def _wmo(self, item): + return item.isvalid + + def __init__(self, initlist=None, name: str = 'unnamed', dtype='str', invalid='raise'): + """Create a registry, i.e. a controlled list + + Parameters + ---------- + initlist: list, optional + List of values to register + name: str, default: 'unnamed' + Name of the Registry + dtype: :class:`str` or dtype, default: :class:`str` + Data type of registry content. Supported values are: 'str', 'wmo', float_wmo + invalid: str, default: 'raise' + Define what do to when a new item is not valid. Can be 'raise' or 'ignore' + """ + self.name = name + self._invalid = invalid + if repr(dtype) == "" or dtype == 'str': + self._validator = self._str + self.dtype = str + elif dtype == float_wmo or str(dtype).lower() == 'wmo': + self._validator = self._wmo + self.dtype = float_wmo + elif repr(dtype) == "" or dtype == 'dict': + self._validator = self._dict + self.dtype = dict + elif hasattr(dtype, 'isvalid'): + self._validator = dtype.isvalid + self.dtype = dtype + else: + raise ValueError("Unrecognised Registry data type '%s'" % dtype) + + if initlist is not None: + initlist = self._process_items(initlist) + super().__init__(initlist) + + def __repr__(self): + summary = ["%s" % str(self.dtype)] + summary.append("Name: %s" % self.name) + N = len(self.data) + msg = "Nitems: %s" % N if N > 1 else "Nitem: %s" % N + summary.append(msg) + if N > 0: + items = [str(item) for item in self.data] + # msg = format_oneline("[%s]" % "; ".join(items), max_width=120) + msg = "[%s]" % "; ".join(items) + summary.append("Content: %s" % msg) + return "\n".join(summary) + + def _process_items(self, items): + if not isinstance(items, list): + items = [items] + if self.dtype == float_wmo: + items = [float_wmo(item, errors=self._invalid) for item in items] + return items + + def commit(self, values): + """R.commit(values) -- append values to the end of the registry if not already in""" + items = self._process_items(values) + for item in items: + if item not in self.data and self._validator(item): + super().append(item) + return self + + def append(self, value): + """R.append(value) -- append value to the end of the registry""" + items = self._process_items(value) + for item in items: + if self._validator(item): + super().append(item) + return self + + def extend(self, other): + """R.extend(iterable) -- extend registry by appending elements from the iterable""" + self.append(other) + return self + + def remove(self, values): + """R.remove(valueS) -- remove first occurrence of values.""" + items = self._process_items(values) + for item in items: + if item in self.data: + super().remove(item) + return self + + def insert(self, index, value): + """R.insert(index, value) -- insert value before index.""" + item = 
self._process_items(value)[0] + if self._validator(item): + super().insert(index, item) + return self + + def __copy__(self): + # Called with copy.copy(R) + return Registry(copy.copy(self.data), dtype=self.dtype) + + def copy(self): + """Return a shallow copy of the registry""" + return self.__copy__() diff --git a/argopy/utils/caching.py b/argopy/utils/caching.py new file mode 100644 index 00000000..7e257f23 --- /dev/null +++ b/argopy/utils/caching.py @@ -0,0 +1,122 @@ +import os +import shutil +import logging +import pickle +import fsspec +import pandas as pd +from packaging import version +from ..options import OPTIONS +from ..errors import FileSystemHasNoCache + +log = logging.getLogger("argopy.utils.caching") + + +def clear_cache(fs=None): + """ Delete argopy cache folder content """ + if os.path.exists(OPTIONS["cachedir"]): + # shutil.rmtree(OPTIONS["cachedir"]) + for filename in os.listdir(OPTIONS["cachedir"]): + file_path = os.path.join(OPTIONS["cachedir"], filename) + try: + if os.path.isfile(file_path) or os.path.islink(file_path): + os.unlink(file_path) + elif os.path.isdir(file_path): + shutil.rmtree(file_path) + except Exception as e: + print("Failed to delete %s. Reason: %s" % (file_path, e)) + if fs: + fs.clear_cache() + + +def lscache(cache_path: str = "", prt=True): + """ Decode and list cache folder content + + Parameters + ---------- + cache_path: str + prt: bool, default=True + Return a printable string or a :class:`pandas.DataFrame` + + Returns + ------- + str or :class:`pandas.DataFrame` + """ + from datetime import datetime + import math + summary = [] + + cache_path = OPTIONS['cachedir'] if cache_path == '' else cache_path + apath = os.path.abspath(cache_path) + log.debug("Listing cache content at: %s" % cache_path) + + def convert_size(size_bytes): + if size_bytes == 0: + return "0B" + size_name = ("B", "KB", "MB", "GB", "TB", "PB", "EB", "ZB", "YB") + i = int(math.floor(math.log(size_bytes, 1024))) + p = math.pow(1024, i) + s = round(size_bytes / p, 2) + return "%s %s" % (s, size_name[i]) + + cached_files = [] + fn = os.path.join(apath, "cache") + if os.path.exists(fn): + with open(fn, "rb") as f: + loaded_cached_files = pickle.load(f) # nosec B301 because files controlled internally + for c in loaded_cached_files.values(): + if isinstance(c["blocks"], list): + c["blocks"] = set(c["blocks"]) + cached_files.append(loaded_cached_files) + else: + raise FileSystemHasNoCache("No fsspec cache system at: %s" % apath) + + cached_files = cached_files or [{}] + cached_files = cached_files[-1] + + N_FILES = len(cached_files) + TOTAL_SIZE = 0 + for cfile in cached_files: + path = os.path.join(apath, cached_files[cfile]['fn']) + TOTAL_SIZE += os.path.getsize(path) + + summary.append("%s %s" % ("=" * 20, "%i files in fsspec cache folder (%s)" % (N_FILES, convert_size(TOTAL_SIZE)))) + summary.append("lscache %s" % os.path.sep.join([apath, ""])) + summary.append("=" * 20) + + listing = {'fn': [], 'size': [], 'time': [], 'original': [], 'uid': [], 'blocks': []} + for cfile in cached_files: + summary.append("- %s" % cached_files[cfile]['fn']) + listing['fn'].append(cached_files[cfile]['fn']) + + path = os.path.join(cache_path, cached_files[cfile]['fn']) + summary.append("\t%8s: %s" % ('SIZE', convert_size(os.path.getsize(path)))) + listing['size'].append(os.path.getsize(path)) + + key = 'time' + ts = cached_files[cfile][key] + tsf = pd.to_datetime(datetime.fromtimestamp(ts)).strftime("%c") + summary.append("\t%8s: %s (%s)" % (key, tsf, ts)) + 
listing['time'].append(pd.to_datetime(datetime.fromtimestamp(ts))) + + if version.parse(fsspec.__version__) > version.parse("0.8.7"): + key = 'original' + summary.append("\t%8s: %s" % (key, cached_files[cfile][key])) + listing[key].append(cached_files[cfile][key]) + + key = 'uid' + summary.append("\t%8s: %s" % (key, cached_files[cfile][key])) + listing[key].append(cached_files[cfile][key]) + + key = 'blocks' + summary.append("\t%8s: %s" % (key, cached_files[cfile][key])) + listing[key].append(cached_files[cfile][key]) + + summary.append("=" * 20) + summary = "\n".join(summary) + if prt: + # Return string to be printed: + return summary + else: + # Return dataframe listing: + # log.debug(summary) + return pd.DataFrame(listing) diff --git a/argopy/utils/chunking.py b/argopy/utils/chunking.py new file mode 100644 index 00000000..4ff7459f --- /dev/null +++ b/argopy/utils/chunking.py @@ -0,0 +1,282 @@ +import numpy as np +import pandas as pd +from functools import reduce +from ..errors import InvalidFetcherAccessPoint +from . import is_box + +import collections +try: + collectionsAbc = collections.abc +except AttributeError: + collectionsAbc = collections + + +class Chunker: + """ To chunk fetcher requests """ + + # Default maximum chunks size for all possible request parameters + default_chunksize = { + "box": { + "lon": 20, # degree + "lat": 20, # degree + "dpt": 500, # meters/db + "time": 3 * 30, + }, # Days + "wmo": {"wmo": 5, "cyc": 100}, # Nb of floats + } # Nb of cycles + + def __init__(self, request: dict, chunks: str = "auto", chunksize: dict = {}): + """ Create a request Chunker + + Allow to easily split an access point request into chunks + + Parameters + ---------- + request: dict + Access point request to be chunked. One of the following: + + - {'box': [lon_min, lon_max, lat_min, lat_max, dpt_min, dpt_max, time_min, time_max]} + - {'box': [lon_min, lon_max, lat_min, lat_max, dpt_min, dpt_max]} + - {'wmo': [wmo1, wmo2, ...], 'cyc': [0,1, ...]} + chunks: 'auto' or dict + Dictionary with request access point as keys and number of chunks to create as values. + + Eg: {'wmo':10} will create a maximum of 10 chunks along WMOs. + chunksize: dict, optional + Dictionary with request access point as keys and chunk size as values (used as maximum values in + 'auto' chunking). + + Eg: {'wmo': 5} will create chunks with as many as 5 WMOs each. + + """ + self.request = request + + if "box" in self.request: + is_box(self.request["box"]) + if len(self.request["box"]) == 8: + self.this_chunker = self._chunker_box4d + elif len(self.request["box"]) == 6: + self.this_chunker = self._chunker_box3d + elif "wmo" in self.request: + self.this_chunker = self._chunker_wmo + else: + raise InvalidFetcherAccessPoint( + "'%s' not valid access point" % ",".join(self.request.keys()) + ) + + default = self.default_chunksize[[k for k in self.request.keys()][0]] + if len(chunksize) == 0: # chunksize = {} + chunksize = default + if not isinstance(chunksize, collectionsAbc.Mapping): + raise ValueError("chunksize must be mappable") + else: # merge with default: + chunksize = {**default, **chunksize} + self.chunksize = collections.OrderedDict(sorted(chunksize.items())) + + default = {k: "auto" for k in self.chunksize.keys()} + if chunks == "auto": # auto for all + chunks = default + elif len(chunks) == 0: # chunks = {}, i.e. 
chunk=1 for all + chunks = {k: 1 for k in self.request} + if not isinstance(chunks, collectionsAbc.Mapping): + raise ValueError("chunks must be 'auto' or mappable") + chunks = {**default, **chunks} + self.chunks = collections.OrderedDict(sorted(chunks.items())) + + def _split(self, lst, n=1): + """Yield successive n-sized chunks from lst""" + for i in range(0, len(lst), n): + yield lst[i: i + n] + + def _split_list_bychunknb(self, lst, n=1): + """Split list in n-imposed chunks of similar size + The last chunk may contain less element than the others, depending on the size of the list. + """ + res = [] + s = int(np.floor_divide(len(lst), n)) + for i in self._split(lst, s): + res.append(i) + if len(res) > n: + res[n - 1::] = [reduce(lambda i, j: i + j, res[n - 1::])] + return res + + def _split_list_bychunksize(self, lst, max_size=1): + """Split list in chunks of imposed size + The last chunk may contain less element than the others, depending on the size of the list. + """ + res = [] + for i in self._split(lst, max_size): + res.append(i) + return res + + def _split_box(self, large_box, n=1, d="x"): # noqa: C901 + """Split a box domain in one direction in n-imposed equal chunks """ + if d == "x": + i_left, i_right = 0, 1 + if d == "y": + i_left, i_right = 2, 3 + if d == "z": + i_left, i_right = 4, 5 + if d == "t": + i_left, i_right = 6, 7 + if n == 1: + return [large_box] + boxes = [] + if d in ["x", "y", "z"]: + n += 1 # Required because we split in linspace + bins = np.linspace(large_box[i_left], large_box[i_right], n) + for ii, left in enumerate(bins): + if ii < len(bins) - 1: + right = bins[ii + 1] + this_box = large_box.copy() + this_box[i_left] = left + this_box[i_right] = right + boxes.append(this_box) + elif "t" in d: + dates = pd.to_datetime(large_box[i_left: i_right + 1]) + date_bounds = [ + d.strftime("%Y%m%d%H%M%S") + for d in pd.date_range(dates[0], dates[1], periods=n + 1) + ] + for i1, i2 in zip(np.arange(0, n), np.arange(1, n + 1)): + left, right = date_bounds[i1], date_bounds[i2] + this_box = large_box.copy() + this_box[i_left] = left + this_box[i_right] = right + boxes.append(this_box) + return boxes + + def _split_this_4Dbox(self, box, nx=1, ny=1, nz=1, nt=1): + box_list = [] + split_x = self._split_box(box, n=nx, d="x") + for bx in split_x: + split_y = self._split_box(bx, n=ny, d="y") + for bxy in split_y: + split_z = self._split_box(bxy, n=nz, d="z") + for bxyz in split_z: + split_t = self._split_box(bxyz, n=nt, d="t") + for bxyzt in split_t: + box_list.append(bxyzt) + return box_list + + def _split_this_3Dbox(self, box, nx=1, ny=1, nz=1): + box_list = [] + split_x = self._split_box(box, n=nx, d="x") + for bx in split_x: + split_y = self._split_box(bx, n=ny, d="y") + for bxy in split_y: + split_z = self._split_box(bxy, n=nz, d="z") + for bxyz in split_z: + box_list.append(bxyz) + return box_list + + def _chunker_box4d(self, request, chunks, chunks_maxsize): # noqa: C901 + BOX = request["box"] + n_chunks = chunks + for axis, n in n_chunks.items(): + if n == "auto": + if axis == "lon": + Lx = BOX[1] - BOX[0] + if Lx > chunks_maxsize["lon"]: # Max box size in longitude + n_chunks["lon"] = int( + np.ceil(np.divide(Lx, chunks_maxsize["lon"])) + ) + else: + n_chunks["lon"] = 1 + if axis == "lat": + Ly = BOX[3] - BOX[2] + if Ly > chunks_maxsize["lat"]: # Max box size in latitude + n_chunks["lat"] = int( + np.ceil(np.divide(Ly, chunks_maxsize["lat"])) + ) + else: + n_chunks["lat"] = 1 + if axis == "dpt": + Lz = BOX[5] - BOX[4] + if Lz > chunks_maxsize["dpt"]: # Max box size in 
depth + n_chunks["dpt"] = int( + np.ceil(np.divide(Lz, chunks_maxsize["dpt"])) + ) + else: + n_chunks["dpt"] = 1 + if axis == "time": + Lt = np.timedelta64( + pd.to_datetime(BOX[7]) - pd.to_datetime(BOX[6]), "D" + ) + MaxLen = np.timedelta64(chunks_maxsize["time"], "D") + if Lt > MaxLen: # Max box size in time + n_chunks["time"] = int(np.ceil(np.divide(Lt, MaxLen))) + else: + n_chunks["time"] = 1 + + boxes = self._split_this_4Dbox( + BOX, + nx=n_chunks["lon"], + ny=n_chunks["lat"], + nz=n_chunks["dpt"], + nt=n_chunks["time"], + ) + return {"chunks": sorted(n_chunks), "values": boxes} + + def _chunker_box3d(self, request, chunks, chunks_maxsize): + BOX = request["box"] + n_chunks = chunks + for axis, n in n_chunks.items(): + if n == "auto": + if axis == "lon": + Lx = BOX[1] - BOX[0] + if Lx > chunks_maxsize["lon"]: # Max box size in longitude + n_chunks["lon"] = int( + np.floor_divide(Lx, chunks_maxsize["lon"]) + ) + else: + n_chunks["lon"] = 1 + if axis == "lat": + Ly = BOX[3] - BOX[2] + if Ly > chunks_maxsize["lat"]: # Max box size in latitude + n_chunks["lat"] = int( + np.floor_divide(Ly, chunks_maxsize["lat"]) + ) + else: + n_chunks["lat"] = 1 + if axis == "dpt": + Lz = BOX[5] - BOX[4] + if Lz > chunks_maxsize["dpt"]: # Max box size in depth + n_chunks["dpt"] = int( + np.floor_divide(Lz, chunks_maxsize["dpt"]) + ) + else: + n_chunks["dpt"] = 1 + # if axis == 'time': + # Lt = np.timedelta64(pd.to_datetime(BOX[5]) - pd.to_datetime(BOX[4]), 'D') + # MaxLen = np.timedelta64(chunks_maxsize['time'], 'D') + # if Lt > MaxLen: # Max box size in time + # n_chunks['time'] = int(np.floor_divide(Lt, MaxLen)) + # else: + # n_chunks['time'] = 1 + boxes = self._split_this_3Dbox( + BOX, nx=n_chunks["lon"], ny=n_chunks["lat"], nz=n_chunks["dpt"] + ) + return {"chunks": sorted(n_chunks), "values": boxes} + + def _chunker_wmo(self, request, chunks, chunks_maxsize): + WMO = request["wmo"] + n_chunks = chunks + if n_chunks["wmo"] == "auto": + wmo_grps = self._split_list_bychunksize(WMO, max_size=chunks_maxsize["wmo"]) + else: + n = np.min([n_chunks["wmo"], len(WMO)]) + wmo_grps = self._split_list_bychunknb(WMO, n=n) + n_chunks["wmo"] = len(wmo_grps) + return {"chunks": sorted(n_chunks), "values": wmo_grps} + + def fit_transform(self): + """ Chunk a fetcher request + + Returns + ------- + list + """ + self._results = self.this_chunker(self.request, self.chunks, self.chunksize) + # self.chunks = self._results['chunks'] + return self._results["values"] From 28f77027b59da43eccb8b449ca026466f0cc24ab Mon Sep 17 00:00:00 2001 From: Guillaume Maze Date: Fri, 8 Sep 2023 16:23:04 +0200 Subject: [PATCH 17/33] let's try this --- argopy/__init__.py | 7 +- argopy/stores/filesystems.py | 2 +- argopy/tests/test_utilities.py | 181 ----- argopy/tests/test_utils_compute.py | 75 ++ argopy/tests/test_utils_format.py | 60 ++ argopy/tests/test_utils_geo.py | 42 ++ argopy/tests/test_utils_locals.py | 22 + argopy/utilities.py | 1123 ---------------------------- argopy/utils/__init__.py | 34 +- argopy/utils/compute.py | 193 +++++ argopy/utils/format.py | 185 +++++ argopy/utils/geo.py | 149 ++++ argopy/utils/locals.py | 244 ++++++ argopy/utils/loggers.py | 44 ++ argopy/utils/manip.py | 126 ++++ argopy/utils/monitors.py | 169 +++++ argopy/xarray.py | 11 +- 17 files changed, 1350 insertions(+), 1317 deletions(-) create mode 100644 argopy/tests/test_utils_compute.py create mode 100644 argopy/tests/test_utils_format.py create mode 100644 argopy/tests/test_utils_geo.py create mode 100644 argopy/tests/test_utils_locals.py delete mode 100644 
argopy/utilities.py create mode 100644 argopy/utils/compute.py create mode 100644 argopy/utils/format.py create mode 100644 argopy/utils/geo.py create mode 100644 argopy/utils/locals.py create mode 100644 argopy/utils/loggers.py create mode 100644 argopy/utils/manip.py create mode 100644 argopy/utils/monitors.py diff --git a/argopy/__init__.py b/argopy/__init__.py index 8648d332..6ab892b1 100644 --- a/argopy/__init__.py +++ b/argopy/__init__.py @@ -29,17 +29,18 @@ from . import tutorial # noqa: E402 # Other Import -from . import utilities # noqa: E402 +from . import utils as utilities # noqa: E402 from . import stores # noqa: E402 from . import errors # noqa: E402 from . import plot # noqa: E402 from .plot import dashboard, ArgoColors # noqa: E402 -from .utilities import show_versions, show_options, clear_cache, lscache # noqa: E402 -from .utilities import monitor_status as status # noqa: E402 from .options import set_options, reset_options # noqa: E402 from .data_fetchers import CTDRefDataFetcher # noqa: E402 from .stores import ArgoIndex # noqa: E402 +from .utils import show_versions, show_options # noqa: E402 +from .utils import clear_cache, lscache # noqa: E402 from .utils import MonitoredThreadPoolExecutor # noqa: E402, F401 +from .utils import monitor_status as status # noqa: E402 from .related import TopoFetcher, OceanOPSDeployments, ArgoNVSReferenceTables, ArgoDocs, ArgoDOI # noqa: E402 diff --git a/argopy/stores/filesystems.py b/argopy/stores/filesystems.py index 42517f93..0bdbe997 100644 --- a/argopy/stores/filesystems.py +++ b/argopy/stores/filesystems.py @@ -48,7 +48,7 @@ ErddapHTTPNotFound, ) from abc import ABC, abstractmethod -from ..utilities import ( +from ..utils import ( drop_variables_not_in_all_datasets, fill_variables_not_in_all_datasets, ) diff --git a/argopy/tests/test_utilities.py b/argopy/tests/test_utilities.py index 8ccd8d46..508c617f 100644 --- a/argopy/tests/test_utilities.py +++ b/argopy/tests/test_utilities.py @@ -1,5 +1,4 @@ import os -import io import pytest import tempfile import xarray as xr @@ -12,12 +11,9 @@ linear_interpolation_remap, format_oneline, wmo2box, - modified_environ, wrap_longitude, toYearFraction, YearFraction_to_datetime, argo_split_path, - Registry, - float_wmo, get_coriolis_profile_id, get_ea_profile_page, ) @@ -35,182 +31,5 @@ from mocked_http import mocked_httpserver, mocked_server_address -@pytest.mark.parametrize("conda", [False, True], - indirect=False, - ids=["conda=%s" % str(p) for p in [False, True]]) -def test_show_versions(conda): - f = io.StringIO() - argopy.show_versions(file=f, conda=conda) - assert "SYSTEM" in f.getvalue() - - -class Test_linear_interpolation_remap: - @pytest.fixture(autouse=True) - def create_data(self): - # create fake data to test interpolation: - temp = np.random.rand(200, 100) - pres = np.sort( - np.floor( - np.zeros([200, 100]) - + np.linspace(50, 950, 100) - + np.random.randint(-5, 5, [200, 100]) - ) - ) - self.dsfake = xr.Dataset( - { - "TEMP": (["N_PROF", "N_LEVELS"], temp), - "PRES": (["N_PROF", "N_LEVELS"], pres), - }, - coords={ - "N_PROF": ("N_PROF", range(200)), - "N_LEVELS": ("N_LEVELS", range(100)), - "Z_LEVELS": ("Z_LEVELS", np.arange(100, 900, 20)), - }, - ) - - def test_interpolation(self): - # Run it with success: - dsi = linear_interpolation_remap( - self.dsfake["PRES"], - self.dsfake["TEMP"], - self.dsfake["Z_LEVELS"], - z_dim="N_LEVELS", - z_regridded_dim="Z_LEVELS", - ) - assert "remapped" in dsi.dims - - def test_interpolation_1d(self): - # Run it with success: - dsi = 
linear_interpolation_remap( - self.dsfake["PRES"].isel(N_PROF=0), - self.dsfake["TEMP"].isel(N_PROF=0), - self.dsfake["Z_LEVELS"], - z_regridded_dim="Z_LEVELS", - ) - assert "remapped" in dsi.dims - - def test_error_zdim(self): - # Test error: - # catches error from _regular_interp linked to z_dim - with pytest.raises(RuntimeError): - linear_interpolation_remap( - self.dsfake["PRES"], - self.dsfake["TEMP"], - self.dsfake["Z_LEVELS"], - z_regridded_dim="Z_LEVELS", - ) - - def test_error_ds(self): - # Test error: - # catches error from linear_interpolation_remap linked to datatype - with pytest.raises(ValueError): - linear_interpolation_remap( - self.dsfake["PRES"], - self.dsfake, - self.dsfake["Z_LEVELS"], - z_dim="N_LEVELS", - z_regridded_dim="Z_LEVELS", - ) - - -def test_format_oneline(): - s = "Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore" - assert isinstance(format_oneline(s), str) - assert isinstance(format_oneline(s[0:5]), str) - s = format_oneline(s, max_width=12) - assert isinstance(s, str) and len(s) == 12 - - -def test_modified_environ(): - os.environ["DUMMY_ENV_ARGOPY"] = 'initial' - with modified_environ(DUMMY_ENV_ARGOPY='toto'): - assert os.environ['DUMMY_ENV_ARGOPY'] == 'toto' - assert os.environ['DUMMY_ENV_ARGOPY'] == 'initial' - os.environ.pop('DUMMY_ENV_ARGOPY') - - -def test_wmo2box(): - with pytest.raises(ValueError): - wmo2box(12) - with pytest.raises(ValueError): - wmo2box(8000) - with pytest.raises(ValueError): - wmo2box(2000) - - def complete_box(b): - b2 = b.copy() - b2.insert(4, 0.) - b2.insert(5, 10000.) - return b2 - - assert is_box(complete_box(wmo2box(1212))) - assert is_box(complete_box(wmo2box(3324))) - assert is_box(complete_box(wmo2box(5402))) - assert is_box(complete_box(wmo2box(7501))) - - -def test_wrap_longitude(): - assert wrap_longitude(np.array([-20])) == 340 - assert wrap_longitude(np.array([40])) == 40 - assert np.all(np.equal(wrap_longitude(np.array([340, 20])), np.array([340, 380]))) - - -def test_toYearFraction(): - assert toYearFraction(pd.to_datetime('202001010000')) == 2020 - assert toYearFraction(pd.to_datetime('202001010000', utc=True)) == 2020 - assert toYearFraction(pd.to_datetime('202001010000')+pd.offsets.DateOffset(years=1)) == 2021 - - -def test_YearFraction_to_datetime(): - assert YearFraction_to_datetime(2020) == pd.to_datetime('202001010000') - assert YearFraction_to_datetime(2020+1) == pd.to_datetime('202101010000') - - -class Test_argo_split_path: - ############# - # UTILITIES # - ############# - # src = "https://data-argo.ifremer.fr/dac" - src = argopy.tutorial.open_dataset("gdac")[0] + "/dac" - list_of_files = [ - src + "/bodc/6901929/6901929_prof.nc", # core / multi-profile - src + "/coriolis/3902131/3902131_Sprof.nc", # bgc / synthetic multi-profile - - src + "/meds/4901079/profiles/D4901079_110.nc", # core / mono-profile / Delayed - src + "/aoml/13857/profiles/R13857_001.nc", # core / mono-profile / Real - - src + "/coriolis/3902131/profiles/SD3902131_001.nc", # bgc / synthetic mono-profile / Delayed - src + "/coriolis/3902131/profiles/SD3902131_001D.nc", # bgc / synthetic mono-profile / Delayed / Descent - src + "/coriolis/6903247/profiles/SR6903247_134.nc", # bgc / synthetic mono-profile / Real - src + "/coriolis/6903247/profiles/SR6903247_134D.nc", # bgc / synthetic mono-profile / Real / Descent - - src + "/coriolis/3902131/profiles/BR3902131_001.nc", # bgc / mono-profile / Real - src + "/coriolis/3902131/profiles/BR3902131_001D.nc", # bgc / mono-profile / 
Real / Descent - - src + "/aoml/5900446/5900446_Dtraj.nc", # traj / Delayed - src + "/csio/2902696/2902696_Rtraj.nc", # traj / Real - - src + "/coriolis/3902131/3902131_BRtraj.nc", # bgc / traj / Real - # src + "/coriolis/6903247/6903247_BRtraj.nc", # bgc / traj / Real - - src + "/incois/2902269/2902269_tech.nc", # technical - # src + "/nmdis/2901623/2901623_tech.nc", # technical - - src + "/jma/4902252/4902252_meta.nc", # meta-data - # src + "/coriolis/1900857/1900857_meta.nc", # meta-data - ] - list_of_files = [f.replace("/", os.path.sep) for f in list_of_files] - - ######### - # TESTS # - ######### - - @pytest.mark.parametrize("file", list_of_files, - indirect=False) - def test_argo_split_path(self, file): - desc = argo_split_path(file) - assert isinstance(desc, dict) - for key in ['origin', 'path', 'name', 'type', 'extension', 'wmo', 'dac']: - assert key in desc diff --git a/argopy/tests/test_utils_compute.py b/argopy/tests/test_utils_compute.py new file mode 100644 index 00000000..2806fd14 --- /dev/null +++ b/argopy/tests/test_utils_compute.py @@ -0,0 +1,75 @@ +import pytest +import numpy as np +import xarray as xr + +from argopy.utils.compute import linear_interpolation_remap + + +class Test_linear_interpolation_remap: + @pytest.fixture(autouse=True) + def create_data(self): + # create fake data to test interpolation: + temp = np.random.rand(200, 100) + pres = np.sort( + np.floor( + np.zeros([200, 100]) + + np.linspace(50, 950, 100) + + np.random.randint(-5, 5, [200, 100]) + ) + ) + self.dsfake = xr.Dataset( + { + "TEMP": (["N_PROF", "N_LEVELS"], temp), + "PRES": (["N_PROF", "N_LEVELS"], pres), + }, + coords={ + "N_PROF": ("N_PROF", range(200)), + "N_LEVELS": ("N_LEVELS", range(100)), + "Z_LEVELS": ("Z_LEVELS", np.arange(100, 900, 20)), + }, + ) + + def test_interpolation(self): + # Run it with success: + dsi = linear_interpolation_remap( + self.dsfake["PRES"], + self.dsfake["TEMP"], + self.dsfake["Z_LEVELS"], + z_dim="N_LEVELS", + z_regridded_dim="Z_LEVELS", + ) + assert "remapped" in dsi.dims + + def test_interpolation_1d(self): + # Run it with success: + dsi = linear_interpolation_remap( + self.dsfake["PRES"].isel(N_PROF=0), + self.dsfake["TEMP"].isel(N_PROF=0), + self.dsfake["Z_LEVELS"], + z_regridded_dim="Z_LEVELS", + ) + assert "remapped" in dsi.dims + + def test_error_zdim(self): + # Test error: + # catches error from _regular_interp linked to z_dim + with pytest.raises(RuntimeError): + linear_interpolation_remap( + self.dsfake["PRES"], + self.dsfake["TEMP"], + self.dsfake["Z_LEVELS"], + z_regridded_dim="Z_LEVELS", + ) + + def test_error_ds(self): + # Test error: + # catches error from linear_interpolation_remap linked to datatype + with pytest.raises(ValueError): + linear_interpolation_remap( + self.dsfake["PRES"], + self.dsfake, + self.dsfake["Z_LEVELS"], + z_dim="N_LEVELS", + z_regridded_dim="Z_LEVELS", + ) + diff --git a/argopy/tests/test_utils_format.py b/argopy/tests/test_utils_format.py new file mode 100644 index 00000000..6d3c161c --- /dev/null +++ b/argopy/tests/test_utils_format.py @@ -0,0 +1,60 @@ +import os +import pytest +import argopy +from argopy.utils.format import format_oneline, argo_split_path + + +def test_format_oneline(): + s = "Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore" + assert isinstance(format_oneline(s), str) + assert isinstance(format_oneline(s[0:5]), str) + s = format_oneline(s, max_width=12) + assert isinstance(s, str) and len(s) == 12 + + +class Test_argo_split_path: + 
############# + # UTILITIES # + ############# + # src = "https://data-argo.ifremer.fr/dac" + src = argopy.tutorial.open_dataset("gdac")[0] + "/dac" + list_of_files = [ + src + "/bodc/6901929/6901929_prof.nc", # core / multi-profile + src + "/coriolis/3902131/3902131_Sprof.nc", # bgc / synthetic multi-profile + + src + "/meds/4901079/profiles/D4901079_110.nc", # core / mono-profile / Delayed + src + "/aoml/13857/profiles/R13857_001.nc", # core / mono-profile / Real + + src + "/coriolis/3902131/profiles/SD3902131_001.nc", # bgc / synthetic mono-profile / Delayed + src + "/coriolis/3902131/profiles/SD3902131_001D.nc", # bgc / synthetic mono-profile / Delayed / Descent + src + "/coriolis/6903247/profiles/SR6903247_134.nc", # bgc / synthetic mono-profile / Real + src + "/coriolis/6903247/profiles/SR6903247_134D.nc", # bgc / synthetic mono-profile / Real / Descent + + src + "/coriolis/3902131/profiles/BR3902131_001.nc", # bgc / mono-profile / Real + src + "/coriolis/3902131/profiles/BR3902131_001D.nc", # bgc / mono-profile / Real / Descent + + src + "/aoml/5900446/5900446_Dtraj.nc", # traj / Delayed + src + "/csio/2902696/2902696_Rtraj.nc", # traj / Real + + src + "/coriolis/3902131/3902131_BRtraj.nc", # bgc / traj / Real + # src + "/coriolis/6903247/6903247_BRtraj.nc", # bgc / traj / Real + + src + "/incois/2902269/2902269_tech.nc", # technical + # src + "/nmdis/2901623/2901623_tech.nc", # technical + + src + "/jma/4902252/4902252_meta.nc", # meta-data + # src + "/coriolis/1900857/1900857_meta.nc", # meta-data + ] + list_of_files = [f.replace("/", os.path.sep) for f in list_of_files] + + ######### + # TESTS # + ######### + + @pytest.mark.parametrize("file", list_of_files, + indirect=False) + def test_argo_split_path(self, file): + desc = argo_split_path(file) + assert isinstance(desc, dict) + for key in ['origin', 'path', 'name', 'type', 'extension', 'wmo', 'dac']: + assert key in desc diff --git a/argopy/tests/test_utils_geo.py b/argopy/tests/test_utils_geo.py new file mode 100644 index 00000000..609242c9 --- /dev/null +++ b/argopy/tests/test_utils_geo.py @@ -0,0 +1,42 @@ +import pytest +import numpy as np +import pandas as pd +from argopy.utils.geo import wmo2box, wrap_longitude, toYearFraction, YearFraction_to_datetime +from argopy.utils.checkers import is_box + + +def test_wmo2box(): + with pytest.raises(ValueError): + wmo2box(12) + with pytest.raises(ValueError): + wmo2box(8000) + with pytest.raises(ValueError): + wmo2box(2000) + + def complete_box(b): + b2 = b.copy() + b2.insert(4, 0.) + b2.insert(5, 10000.) 
+ return b2 + + assert is_box(complete_box(wmo2box(1212))) + assert is_box(complete_box(wmo2box(3324))) + assert is_box(complete_box(wmo2box(5402))) + assert is_box(complete_box(wmo2box(7501))) + + +def test_wrap_longitude(): + assert wrap_longitude(np.array([-20])) == 340 + assert wrap_longitude(np.array([40])) == 40 + assert np.all(np.equal(wrap_longitude(np.array([340, 20])), np.array([340, 380]))) + + +def test_toYearFraction(): + assert toYearFraction(pd.to_datetime('202001010000')) == 2020 + assert toYearFraction(pd.to_datetime('202001010000', utc=True)) == 2020 + assert toYearFraction(pd.to_datetime('202001010000')+pd.offsets.DateOffset(years=1)) == 2021 + + +def test_YearFraction_to_datetime(): + assert YearFraction_to_datetime(2020) == pd.to_datetime('202001010000') + assert YearFraction_to_datetime(2020+1) == pd.to_datetime('202101010000') diff --git a/argopy/tests/test_utils_locals.py b/argopy/tests/test_utils_locals.py new file mode 100644 index 00000000..fa04418d --- /dev/null +++ b/argopy/tests/test_utils_locals.py @@ -0,0 +1,22 @@ +import os +import pytest +import io +import argopy +from ..utils.locals import modified_environ + + +@pytest.mark.parametrize("conda", [False, True], + indirect=False, + ids=["conda=%s" % str(p) for p in [False, True]]) +def test_show_versions(conda): + f = io.StringIO() + argopy.show_versions(file=f, conda=conda) + assert "SYSTEM" in f.getvalue() + + +def test_modified_environ(): + os.environ["DUMMY_ENV_ARGOPY"] = 'initial' + with modified_environ(DUMMY_ENV_ARGOPY='toto'): + assert os.environ['DUMMY_ENV_ARGOPY'] == 'toto' + assert os.environ['DUMMY_ENV_ARGOPY'] == 'initial' + os.environ.pop('DUMMY_ENV_ARGOPY') diff --git a/argopy/utilities.py b/argopy/utilities.py deleted file mode 100644 index 2a8cf81a..00000000 --- a/argopy/utilities.py +++ /dev/null @@ -1,1123 +0,0 @@ -#!/bin/env python -# -*coding: UTF-8 -*- -# -# Disclaimer: -# Functions get_sys_info, netcdf_and_hdf5_versions and show_versions are from: -# xarray/util/print_versions.py -# - -import os -import sys -import warnings -import urllib -import json -import collections -import copy -from functools import reduce, wraps -from packaging import version -import logging -from urllib.parse import urlparse -from typing import Union -import inspect -import pathlib -import importlib -import locale -import platform -import struct -import subprocess # nosec B404 only used without user inputs -import contextlib -from fsspec.core import split_protocol -import fsspec -from functools import lru_cache - -import xarray as xr -import pandas as pd -import numpy as np -from scipy import interpolate - -import pickle # nosec B403 only used with internal files/assets -import shutil - -import threading -from socket import gaierror - -import time -import setuptools # noqa: F401 - -from .options import OPTIONS -from .errors import ( - FtpPathError, - InvalidFetcher, - InvalidFetcherAccessPoint, - InvalidOption, - InvalidDatasetStructure, - FileSystemHasNoCache, - DataNotFound, -) -from .utils import ( - is_box, - is_list_of_strings, - is_wmo, check_wmo, - check_cyc, -) -from .related import ( - ArgoNVSReferenceTables, -) - -try: - collectionsAbc = collections.abc -except AttributeError: - collectionsAbc = collections - -try: - importlib.import_module('matplotlib') # noqa: E402 - from matplotlib.colors import to_hex -except ImportError: - pass - -path2assets = importlib.util.find_spec('argopy.static.assets').submodule_search_locations[0] - -log = logging.getLogger("argopy.utilities") - - -def get_sys_info(): - 
"""Returns system information as a dict""" - - blob = [] - - # get full commit hash - commit = None - if os.path.isdir(".git") and os.path.isdir("argopy"): - try: - pipe = subprocess.Popen( # nosec No user provided input to control here - 'git log --format="%H" -n 1'.split(" "), - stdout=subprocess.PIPE, - stderr=subprocess.PIPE, - ) - so, serr = pipe.communicate() - except Exception: - pass - else: - if pipe.returncode == 0: - commit = so - try: - commit = so.decode("utf-8") - except ValueError: - pass - commit = commit.strip().strip('"') - - blob.append(("commit", commit)) - - try: - (sysname, nodename, release, version_, machine, processor) = platform.uname() - blob.extend( - [ - ("python", sys.version), - ("python-bits", struct.calcsize("P") * 8), - ("OS", "%s" % (sysname)), - ("OS-release", "%s" % (release)), - ("machine", "%s" % (machine)), - ("processor", "%s" % (processor)), - ("byteorder", "%s" % sys.byteorder), - ("LC_ALL", "%s" % os.environ.get("LC_ALL", "None")), - ("LANG", "%s" % os.environ.get("LANG", "None")), - ("LOCALE", "%s.%s" % locale.getlocale()), - ] - ) - except Exception: - pass - - return blob - - -def netcdf_and_hdf5_versions(): - libhdf5_version = None - libnetcdf_version = None - try: - import netCDF4 - - libhdf5_version = netCDF4.__hdf5libversion__ - libnetcdf_version = netCDF4.__netcdf4libversion__ - except ImportError: - try: - import h5py - - libhdf5_version = h5py.version.hdf5_version - except ImportError: - pass - return [("libhdf5", libhdf5_version), ("libnetcdf", libnetcdf_version)] - - -def show_versions(file=sys.stdout, conda=False): # noqa: C901 - """ Print the versions of argopy and its dependencies - - Parameters - ---------- - file : file-like, optional - print to the given file-like object. Defaults to sys.stdout. - conda: bool, optional - format versions to be copy/pasted on a conda environment file (default, False) - """ - sys_info = get_sys_info() - - try: - sys_info.extend(netcdf_and_hdf5_versions()) - except Exception as e: - print(f"Error collecting netcdf / hdf5 version: {e}") - - DEPS = { - 'core': sorted([ - ("argopy", lambda mod: mod.__version__), - - ("xarray", lambda mod: mod.__version__), - ("scipy", lambda mod: mod.__version__), - ("netCDF4", lambda mod: mod.__version__), - ("erddapy", lambda mod: mod.__version__), # This could go away from requirements ? 
- ("fsspec", lambda mod: mod.__version__), - ("aiohttp", lambda mod: mod.__version__), - ("packaging", lambda mod: mod.__version__), # will come with xarray, Using 'version' to make API compatible with several fsspec releases - ("requests", lambda mod: mod.__version__), - ("toolz", lambda mod: mod.__version__), - ]), - 'ext.util': sorted([ - ("gsw", lambda mod: mod.__version__), # Used by xarray accessor to compute new variables - ("tqdm", lambda mod: mod.__version__), - ("zarr", lambda mod: mod.__version__), - ]), - 'ext.perf': sorted([ - ("dask", lambda mod: mod.__version__), - ("distributed", lambda mod: mod.__version__), - ("pyarrow", lambda mod: mod.__version__), - ]), - 'ext.plot': sorted([ - ("matplotlib", lambda mod: mod.__version__), - ("cartopy", lambda mod: mod.__version__), - ("seaborn", lambda mod: mod.__version__), - ("IPython", lambda mod: mod.__version__), - ("ipywidgets", lambda mod: mod.__version__), - ("ipykernel", lambda mod: mod.__version__), - ]), - 'dev': sorted([ - - ("bottleneck", lambda mod: mod.__version__), - ("cftime", lambda mod: mod.__version__), - ("cfgrib", lambda mod: mod.__version__), - ("conda", lambda mod: mod.__version__), - ("nc_time_axis", lambda mod: mod.__version__), - - ("numpy", lambda mod: mod.__version__), # will come with xarray and pandas - ("pandas", lambda mod: mod.__version__), # will come with xarray - - ("pip", lambda mod: mod.__version__), - ("black", lambda mod: mod.__version__), - ("flake8", lambda mod: mod.__version__), - ("pytest", lambda mod: mod.__version__), # will come with pandas - ("pytest_env", lambda mod: mod.__version__), # will come with pandas - ("pytest_cov", lambda mod: mod.__version__), # will come with pandas - ("pytest_localftpserver", lambda mod: mod.__version__), # will come with pandas - ("pytest_reportlog", lambda mod: mod.__version__), # will come with pandas - ("setuptools", lambda mod: mod.__version__), - ("aiofiles", lambda mod: mod.__version__), - ("sphinx", lambda mod: mod.__version__), - ]), - } - - DEPS_blob = {} - for level in DEPS.keys(): - deps = DEPS[level] - deps_blob = list() - for (modname, ver_f) in deps: - try: - if modname in sys.modules: - mod = sys.modules[modname] - else: - mod = importlib.import_module(modname) - except Exception: - deps_blob.append((modname, '-')) - else: - try: - ver = ver_f(mod) - deps_blob.append((modname, ver)) - except Exception: - deps_blob.append((modname, "installed")) - DEPS_blob[level] = deps_blob - - print("\nSYSTEM", file=file) - print("------", file=file) - for k, stat in sys_info: - print(f"{k}: {stat}", file=file) - - for level in DEPS_blob: - if conda: - print("\n# %s:" % level.upper(), file=file) - else: - title = "INSTALLED VERSIONS: %s" % level.upper() - print("\n%s" % title, file=file) - print("-" * len(title), file=file) - deps_blob = DEPS_blob[level] - for k, stat in deps_blob: - if conda: - if k != 'argopy': - kf = k.replace("_", "-") - comment = ' ' if stat != '-' else '# ' - print(f"{comment} - {kf} = {stat}", file=file) # Format like a conda env line, useful to update ci/requirements - else: - print("{:<12}: {:<12}".format(k, stat), file=file) - - -def show_options(file=sys.stdout): # noqa: C901 - """ Print options of argopy - - Parameters - ---------- - file : file-like, optional - print to the given file-like object. Defaults to sys.stdout. 
- """ - print("\nARGOPY OPTIONS", file=file) - print("--------------", file=file) - opts = copy.deepcopy(OPTIONS) - opts = dict(sorted(opts.items())) - for k, v in opts.items(): - print(f"{k}: {v}", file=file) - - -def badge(label="label", message="message", color="green", insert=False): - """ Return or insert shield.io badge image - - Use the shields.io service to create a badge image - - https://img.shields.io/static/v1?label=