From 9d09ff9658c4fdf958a80253d60bfb1e8cbfa365 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 1 Aug 2023 17:07:58 +0000 Subject: [PATCH 01/30] mvp remove intake from Read --- icepyx/core/read.py | 51 ++++++++++++++++++++++++--------------------- 1 file changed, 27 insertions(+), 24 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index 5a497279a..5860e32dc 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -4,6 +4,7 @@ import numpy as np import xarray as xr +import h5py import icepyx.core.is2cat as is2cat import icepyx.core.is2ref as is2ref @@ -258,7 +259,7 @@ def __init__( catalog=None, out_obj_type=None, # xr.Dataset, ): - + # Note: maybe just don't add default values, so that Python enforces their existence? if data_source is None: raise ValueError("Please provide a data source.") else: @@ -271,10 +272,16 @@ def __init__( ) else: self._prod = is2ref._validate_product(product) - + + # TODO delete? seems like it just validates the pattern + # Does Read accept a directory right now? Why would there be multiple files in the list? + # seems like yes, it does accept a directory + # does it check, then, that all the files have the same version and product? pattern_ck, filelist = Read._check_source_for_pattern( data_source, filename_pattern ) + print('pattern_ck', pattern_ck) + print('filelist', filelist) assert pattern_ck # Note: need to check if this works for subset and non-subset NSIDC files (processed_ prepends the former) self._pattern = filename_pattern @@ -282,7 +289,8 @@ def __init__( # this is a first pass at getting rid of mixed product types and warning the user. 
# it takes an approach assuming the product name is in the filename, but needs reworking if we let multiple products be loaded # one way to handle this would be bring in the product info during the loading step and fill in product there instead of requiring it from the user - filtered_filelist = [file for file in filelist if self._prod in file] + filtered_filelist = [file for file in filelist if self._prod in Read._get_product_and_version(file)] + print('filtered', filtered_filelist) if len(filtered_filelist) == 0: warnings.warn( "Your filenames do not contain a product identifier (e.g. ATL06). " @@ -665,6 +673,13 @@ def _build_dataset_template(self, file): attrs=dict(data_product=self._prod), ) return is2ds + + def _get_product_and_version(filepath): + # TODO either persist this info or remove 'version', since it isn't necessary right now + with h5py.File(filepath, 'r') as f: + product = f['METADATA']['DatasetIdentification'].attrs['shortName'].decode() + version = f['METADATA']['DatasetIdentification'].attrs['VersionID'].decode() + return product, version def _read_single_grp(self, file, grp_path): """ @@ -684,25 +699,10 @@ def _read_single_grp(self, file, grp_path): Xarray dataset with the specified group. """ - - try: - grpcat = is2cat.build_catalog( - file, self._pattern, self._source_type, grp_paths=grp_path - ) - ds = grpcat[self._source_type].read() - - # NOTE: could also do this with h5py, but then would have to read in each variable in the group separately - except ValueError: - grpcat = is2cat.build_catalog( - file, - self._pattern, - self._source_type, - grp_paths=grp_path, - extra_engine_kwargs={"phony_dims": "access"}, - ) - ds = grpcat[self._source_type].read() - - return ds + # I think this would fail if a group that has too high of a level of nesting + # is given. Consider this. 
+ # TODO: update docstring + return xr.open_dataset(file, group=grp_path) def _build_single_file_dataset(self, file, groups_list): """ @@ -722,8 +722,11 @@ def _build_single_file_dataset(self, file, groups_list): ------- Xarray Dataset """ - - file_product = self._read_single_grp(file, "/").attrs["identifier_product_type"] + # why do we do get the product twice? is it important to us that the user tells us + # correctly their product? Do we trust the metadata or the filename more? + # Also revisit the semantics of this. Not sure if it makes semantic sense for this + # to be a class method + file_product, _ = Read._get_product_and_version(file) assert ( file_product == self._prod ), "Your product specification does not match the product specification within your files." From 24f6a42df3b06bf93e2f16e90434a70aef5d4b1c Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 29 Aug 2023 15:58:03 +0000 Subject: [PATCH 02/30] delete is2cat and references --- icepyx/core/is2cat.py | 178 ------------------------------------------ icepyx/core/read.py | 78 +++++++++++------- 2 files changed, 51 insertions(+), 205 deletions(-) delete mode 100644 icepyx/core/is2cat.py diff --git a/icepyx/core/is2cat.py b/icepyx/core/is2cat.py deleted file mode 100644 index f4e66a7bf..000000000 --- a/icepyx/core/is2cat.py +++ /dev/null @@ -1,178 +0,0 @@ -from intake.catalog import Catalog - -# Need to post on intake's page to see if this would be a useful contribution... -# https://github.com/intake/intake/blob/0.6.4/intake/source/utils.py#L216 -def _pattern_to_glob(pattern): - """ - Adapted from intake.source.utils.path_to_glob to convert a path as pattern into a glob style path - that uses the pattern's indicated number of '?' instead of '*' where an int was specified. - - Returns pattern if pattern is not a string. 
- - Parameters - ---------- - pattern : str - Path as pattern optionally containing format_strings - - Returns - ------- - glob_path : str - Path with int format strings replaced with the proper number of '?' and '*' otherwise. - - Examples - -------- - >>> _pattern_to_glob('{year}/{month}/{day}.csv') - '*/*/*.csv' - >>> _pattern_to_glob('{year:4}/{month:2}/{day:2}.csv') - '????/??/??.csv' - >>> _pattern_to_glob('data/{year:4}{month:02}{day:02}.csv') - 'data/????????.csv' - >>> _pattern_to_glob('data/*.csv') - 'data/*.csv' - """ - from string import Formatter - - if not isinstance(pattern, str): - return pattern - - fmt = Formatter() - glob_path = "" - # prev_field_name = None - for literal_text, field_name, format_specs, _ in fmt.parse(format_string=pattern): - glob_path += literal_text - if field_name and (glob_path != "*"): - try: - glob_path += "?" * int(format_specs) - except ValueError: - glob_path += "*" - # alternatively, you could use bits=utils._get_parts_of_format_string(resolved_string, literal_texts, format_specs) - # and then use len(bits[i]) to get the length of each format_spec - # print(glob_path) - return glob_path - - -def build_catalog( - data_source, - path_pattern, - source_type, - grp_paths=None, - grp_path_params=None, - extra_engine_kwargs=None, - **kwargs -): - """ - Build a general Intake catalog for reading in ICESat-2 data. - This function is used by the read class object to create catalogs from lists of ICESat-2 variables. - - Parameters - ---------- - data_source : string - A string with a full file path or full directory path to ICESat-2 hdf5 (.h5) format files. - Files within a directory must have a consistent filename pattern that includes the "ATL??" data product name. - Files must all be within a single directory. - - path_pattern : string - String that shows the filename pattern as required for Intake's path_as_pattern argument. - - source_type : string - String to use as the Local Catalog Entry name. 
- - grp_paths : str, default None - Variable paths to load. - Can include general parameter names, which must be contained within double curly brackets and further - described in `grp_path_params`. - Default list based on data product of provided files. - If multiple data products are included in the files, the default list will be for the product of the first file. - This may result in errors during read-in if all files do not have the same variable paths. - - grp_path_params : [dict], default None - List of dictionaries with a keyword for each parameter name specified in the `grp_paths` string. - Each parameter keyword should contain a dictionary with the acceptable keyword-value pairs for the driver being used. - - **kwargs : - Keyword arguments to be passed through to `intake.catalog.Catalog.from_dict()`. - Keywords needed to override default inputs include: - - `source_args_dict` # highest level source information; keys include: "urlpath", "path_as_pattern", driver-specific ("xarray_kwargs" is default) - - `metadata_dict` - - `source_dict` # individual source entry information (default is supplied by data object; "name", "description", "driver", "args") - - `defaults_dict` # catalog "name", "description", "metadata", "entries", etc. - - Returns - ------- - intake.catalog.Catalog object - - See Also - -------- - read.Read - - """ - from intake.catalog.local import LocalCatalogEntry, UserParameter - import intake_xarray - - import icepyx.core.APIformatting as apifmt - - assert ( - grp_paths - ), "You must enter a variable path or you will not be able to read in any data." - - # generalize this/make it so the [engine] values can be entered as kwargs... 
- engine_key = "xarray_kwargs" - xarray_kwargs_dict = {"engine": "h5netcdf", "group": grp_paths} - if extra_engine_kwargs: - for key in extra_engine_kwargs.keys(): - xarray_kwargs_dict[key] = extra_engine_kwargs[key] - - source_args_dict = { - "urlpath": data_source, - "path_as_pattern": path_pattern, - engine_key: xarray_kwargs_dict, - } - - metadata_dict = {"version": 1} - - source_dict = { - "name": source_type, - "description": "", - "driver": "intake_xarray.netcdf.NetCDFSource", # NOTE: this must be a string or the catalog cannot be imported after saving - "args": source_args_dict, - } - - if grp_path_params: - source_dict = apifmt.combine_params( - source_dict, - {"parameters": [UserParameter(**params) for params in grp_path_params]}, - ) - - # NOTE: LocalCatalogEntry has some required positional args (name, description, driver) - # I tried doing this generally with *source_dict after the positional args (instead of as part of the if) - # but apparently I don't quite get something about passing dicts with * and ** and couldn't make it work - local_cat_source = { - source_type: LocalCatalogEntry( - name=source_dict.pop("name"), - description=source_dict.pop("description"), - driver=source_dict.pop("driver"), - parameters=source_dict.pop("parameters"), - args=source_dict.pop("args"), - ) - } - - else: - local_cat_source = { - source_type: LocalCatalogEntry( - name=source_dict.pop("name"), - description=source_dict.pop("description"), - driver=source_dict.pop("driver"), - args=source_dict.pop("args"), - ) - } - - defaults_dict = { - "name": "IS2-hdf5-icepyx-intake-catalog", - "description": "an icepyx-generated catalog for creating local ICESat-2 intake entries", - "metadata": metadata_dict, - "entries": local_cat_source, - } - - build_cat_dict = apifmt.combine_params(defaults_dict, kwargs) - - return Catalog.from_dict(**build_cat_dict) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index 5860e32dc..c4c10b296 100644 --- a/icepyx/core/read.py +++ 
b/icepyx/core/read.py @@ -6,7 +6,6 @@ import xarray as xr import h5py -import icepyx.core.is2cat as is2cat import icepyx.core.is2ref as is2ref from icepyx.core.variables import Variables as Variables from icepyx.core.variables import list_of_dict_vals @@ -207,6 +206,56 @@ def _run_fast_scandir(dir, fn_glob): return subfolders, files +# Need to post on intake's page to see if this would be a useful contribution... +# https://github.com/intake/intake/blob/0.6.4/intake/source/utils.py#L216 +def _pattern_to_glob(pattern): + """ + Adapted from intake.source.utils.path_to_glob to convert a path as pattern into a glob style path + that uses the pattern's indicated number of '?' instead of '*' where an int was specified. + + Returns pattern if pattern is not a string. + + Parameters + ---------- + pattern : str + Path as pattern optionally containing format_strings + + Returns + ------- + glob_path : str + Path with int format strings replaced with the proper number of '?' and '*' otherwise. + + Examples + -------- + >>> _pattern_to_glob('{year}/{month}/{day}.csv') + '*/*/*.csv' + >>> _pattern_to_glob('{year:4}/{month:2}/{day:2}.csv') + '????/??/??.csv' + >>> _pattern_to_glob('data/{year:4}{month:02}{day:02}.csv') + 'data/????????.csv' + >>> _pattern_to_glob('data/*.csv') + 'data/*.csv' + """ + from string import Formatter + + if not isinstance(pattern, str): + return pattern + + fmt = Formatter() + glob_path = "" + # prev_field_name = None + for literal_text, field_name, format_specs, _ in fmt.parse(format_string=pattern): + glob_path += literal_text + if field_name and (glob_path != "*"): + try: + glob_path += "?" 
* int(format_specs) + except ValueError: + glob_path += "*" + # alternatively, you could use bits=utils._get_parts_of_format_string(resolved_string, literal_texts, format_specs) + # and then use len(bits[i]) to get the length of each format_spec + # print(glob_path) + return glob_path + # To do: test this class and functions therein class Read: @@ -322,28 +371,6 @@ def __init__( # ---------------------------------------------------------------------- # Properties - @property - def is2catalog(self): - """ - Print a generic ICESat-2 Intake catalog. - This catalog does not specify groups, so it cannot be used to read in data. - - """ - if not hasattr(self, "_is2catalog") and hasattr(self, "_catalog_path"): - from intake import open_catalog - - self._is2catalog = open_catalog(self._catalog_path) - - else: - self._is2catalog = is2cat.build_catalog( - self.data_source, - self._pattern, - self._source_type, - grp_paths="/paths/to/variables", - ) - - return self._is2catalog - # I cut and pasted this directly out of the Query class - going to need to reconcile the _source/file stuff there @property @@ -378,7 +405,7 @@ def _check_source_for_pattern(source, filename_pattern): """ Check that the entered data source contains files that match the input filename_pattern """ - glob_pattern = is2cat._pattern_to_glob(filename_pattern) + glob_pattern = _pattern_to_glob(filename_pattern) if os.path.isdir(source): _, filelist = _run_fast_scandir(source, glob_pattern) @@ -609,9 +636,6 @@ def load(self): All items in the wanted variables list will be loaded from the files into memory. If you do not provide a wanted variables list, a default one will be created for you. - - If you would like to use the Intake catalog you provided to read in a single data variable, - simply call Intake's `read()` function on the is2catalog property (e.g. `reader.is2catalog.read()`). 
""" # todo: From b13b8473644589445c79144f6e53a21b7447c383 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Wed, 30 Aug 2023 20:06:14 +0000 Subject: [PATCH 03/30] remove extra comments --- icepyx/core/read.py | 33 ++++++--------------------------- 1 file changed, 6 insertions(+), 27 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index c4c10b296..f272a3aa4 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -305,7 +305,6 @@ def __init__( data_source=None, product=None, filename_pattern="ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5", - catalog=None, out_obj_type=None, # xr.Dataset, ): # Note: maybe just don't add default values, so that Python enforces their existence? @@ -322,15 +321,9 @@ def __init__( else: self._prod = is2ref._validate_product(product) - # TODO delete? seems like it just validates the pattern - # Does Read accept a directory right now? Why would there be multiple files in the list? - # seems like yes, it does accept a directory - # does it check, then, that all the files have the same version and product? pattern_ck, filelist = Read._check_source_for_pattern( data_source, filename_pattern ) - print('pattern_ck', pattern_ck) - print('filelist', filelist) assert pattern_ck # Note: need to check if this works for subset and non-subset NSIDC files (processed_ prepends the former) self._pattern = filename_pattern @@ -338,8 +331,7 @@ def __init__( # this is a first pass at getting rid of mixed product types and warning the user. 
# it takes an approach assuming the product name is in the filename, but needs reworking if we let multiple products be loaded # one way to handle this would be bring in the product info during the loading step and fill in product there instead of requiring it from the user - filtered_filelist = [file for file in filelist if self._prod in Read._get_product_and_version(file)] - print('filtered', filtered_filelist) + filtered_filelist = [file for file in filelist if self._prod in file] if len(filtered_filelist) == 0: warnings.warn( "Your filenames do not contain a product identifier (e.g. ATL06). " @@ -355,11 +347,6 @@ def __init__( self._filelist = filelist # after validation, use the notebook code and code outline to start implementing the rest of the class - if catalog is not None: - assert os.path.isfile( - catalog - ), f"Your catalog path '{catalog}' does not point to a valid file." - self._catalog_path = catalog if out_obj_type is not None: print( @@ -697,17 +684,10 @@ def _build_dataset_template(self, file): attrs=dict(data_product=self._prod), ) return is2ds - - def _get_product_and_version(filepath): - # TODO either persist this info or remove 'version', since it isn't necessary right now - with h5py.File(filepath, 'r') as f: - product = f['METADATA']['DatasetIdentification'].attrs['shortName'].decode() - version = f['METADATA']['DatasetIdentification'].attrs['VersionID'].decode() - return product, version def _read_single_grp(self, file, grp_path): """ - For a given file and variable group path, construct an Intake catalog and use it to read in the data. + For a given file and variable group path, construct an xarray Dataset. Parameters ---------- @@ -723,10 +703,9 @@ def _read_single_grp(self, file, grp_path): Xarray dataset with the specified group. """ - # I think this would fail if a group that has too high of a level of nesting - # is given. Consider this. 
- # TODO: update docstring - return xr.open_dataset(file, group=grp_path) + + return xr.open_dataset(file, group=grp_path, engine='h5netcdf', + backend_kwargs={'phony_dims': 'access'}) def _build_single_file_dataset(self, file, groups_list): """ @@ -750,7 +729,7 @@ def _build_single_file_dataset(self, file, groups_list): # correctly their product? Do we trust the metadata or the filename more? # Also revisit the semantics of this. Not sure if it makes semantic sense for this # to be a class method - file_product, _ = Read._get_product_and_version(file) + file_product = self._read_single_grp(file, "/").attrs["identifier_product_type"] assert ( file_product == self._prod ), "Your product specification does not match the product specification within your files." From 0779b8017a98ac3f2e683fddcaaebc0ca413ceac Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Wed, 30 Aug 2023 20:23:45 +0000 Subject: [PATCH 04/30] update doc strings --- icepyx/core/read.py | 13 +------------ 1 file changed, 1 insertion(+), 12 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index f272a3aa4..d3ca0d82a 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -4,7 +4,6 @@ import numpy as np import xarray as xr -import h5py import icepyx.core.is2ref as is2ref from icepyx.core.variables import Variables as Variables @@ -260,7 +259,7 @@ def _pattern_to_glob(pattern): # To do: test this class and functions therein class Read: """ - Data object to create and use Intake catalogs to read ICESat-2 data into the specified formats. + Data object to read ICESat-2 data into the specified formats. Provides flexiblity for reading nested hdf5 files into common analysis formats. Parameters @@ -279,10 +278,6 @@ class Read: The default describes files downloaded directly from NSIDC (subsetted and non-subsetted) for most products (e.g. ATL06). The ATL11 filename pattern from NSIDC is: 'ATL{product:2}_{rgt:4}{orbitsegment:2}_{cycles:4}_{version:3}_{revision:2}.h5'. 
- catalog : string, default None - Full path to an Intake catalog for reading in data. - If you still need to create a catalog, leave as default. - out_obj_type : object, default xarray.Dataset The desired format for the data to be read in. Currently, only xarray.Dataset objects (default) are available. @@ -307,7 +302,6 @@ def __init__( filename_pattern="ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5", out_obj_type=None, # xr.Dataset, ): - # Note: maybe just don't add default values, so that Python enforces their existence? if data_source is None: raise ValueError("Please provide a data source.") else: @@ -320,7 +314,6 @@ def __init__( ) else: self._prod = is2ref._validate_product(product) - pattern_ck, filelist = Read._check_source_for_pattern( data_source, filename_pattern ) @@ -725,10 +718,6 @@ def _build_single_file_dataset(self, file, groups_list): ------- Xarray Dataset """ - # why do we do get the product twice? is it important to us that the user tells us - # correctly their product? Do we trust the metadata or the filename more? - # Also revisit the semantics of this. 
Not sure if it makes semantic sense for this - # to be a class method file_product = self._read_single_grp(file, "/").attrs["identifier_product_type"] assert ( file_product == self._prod From 1cfbf7208a8de80a1539d25e0c536f6831330c25 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Wed, 30 Aug 2023 20:24:00 +0000 Subject: [PATCH 05/30] update tests --- icepyx/tests/test_read.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/icepyx/tests/test_read.py b/icepyx/tests/test_read.py index 9748ae992..018435968 100644 --- a/icepyx/tests/test_read.py +++ b/icepyx/tests/test_read.py @@ -63,7 +63,6 @@ def test_validate_source_str_not_a_dir_or_file(): ), sorted( [ - "./icepyx/core/is2cat.py", "./icepyx/core/is2ref.py", "./icepyx/tests/is2class_query.py", ] @@ -73,7 +72,7 @@ def test_validate_source_str_not_a_dir_or_file(): ( "./icepyx/core", "is2*.py", - ([], ["./icepyx/core/is2cat.py", "./icepyx/core/is2ref.py"]), + ([], ["./icepyx/core/is2ref.py"]), ), ( "./icepyx", From de61d87e21ccb4e1feb0e289b83a66ffc1690566 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Wed, 30 Aug 2023 20:43:07 +0000 Subject: [PATCH 06/30] update documentation for removing intake --- .../example_notebooks/IS2_data_read-in.ipynb | 2268 +++++++++++++++-- doc/source/user_guide/documentation/read.rst | 1 - 2 files changed, 2052 insertions(+), 217 deletions(-) diff --git a/doc/source/example_notebooks/IS2_data_read-in.ipynb b/doc/source/example_notebooks/IS2_data_read-in.ipynb index dc9d8ed31..b8697b1d7 100644 --- a/doc/source/example_notebooks/IS2_data_read-in.ipynb +++ b/doc/source/example_notebooks/IS2_data_read-in.ipynb @@ -3,7 +3,9 @@ { "cell_type": "markdown", "id": "552e9ef9", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "# Reading ICESat-2 Data in for Analysis\n", "This notebook ({nb-download}`download `) illustrates the use of icepyx for reading ICESat-2 data files, loading them into a data object.\n", @@ -36,7 +38,7 @@ }, { "cell_type": 
"code", - "execution_count": null, + "execution_count": 4, "id": "2b74b672", "metadata": {}, "outputs": [], @@ -47,7 +49,9 @@ { "cell_type": "markdown", "id": "1ffb9a0c", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "---------------------------------\n", "\n", @@ -57,10 +61,18 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 5, "id": "c4390195", "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "You have 6 files matching the filename pattern to be read in.\n" + ] + } + ], "source": [ "path_root = '/full/path/to/your/data/'\n", "pattern = \"processed_ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5\"\n", @@ -69,7 +81,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 6, "id": "2f46029d", "metadata": {}, "outputs": [], @@ -79,10 +91,603 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 7, "id": "c0439388", "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. 
This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n" + ] + }, + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
<xarray.Dataset>\n",
+       "Dimensions:              (photon_idx: 29027, spot: 2, gran_idx: 6)\n",
+       "Coordinates:\n",
+       "  * photon_idx           (photon_idx) int64 0 1 2 3 ... 29023 29024 29025 29026\n",
+       "  * spot                 (spot) uint8 2 5\n",
+       "  * gran_idx             (gran_idx) float64 8.49e+04 9.02e+04 ... 1.016e+05\n",
+       "    source_file          (gran_idx) <U72 '../../../../data/ATL06/processed_AT...\n",
+       "    delta_time           (gran_idx, photon_idx) datetime64[ns] 2019-02-22T01:...\n",
+       "Data variables:\n",
+       "    sc_orient            (gran_idx) int8 0 0 0 1 1 1\n",
+       "    cycle_number         (gran_idx) int8 2 2 2 5 5 5\n",
+       "    rgt                  (gran_idx) int16 849 902 910 986 1001 1016\n",
+       "    atlas_sdp_gps_epoch  (gran_idx) datetime64[ns] 2018-01-01T00:00:18 ... 20...\n",
+       "    data_start_utc       (gran_idx) datetime64[ns] 2019-02-22T01:03:44.199777...\n",
+       "    data_end_utc         (gran_idx) datetime64[ns] 2019-02-22T01:07:38.112326...\n",
+       "    h_li                 (spot, gran_idx, photon_idx) float32 nan nan ... nan\n",
+       "    latitude             (spot, gran_idx, photon_idx) float64 nan nan ... nan\n",
+       "    longitude            (spot, gran_idx, photon_idx) float64 nan nan ... nan\n",
+       "    gt                   (gran_idx, spot) <U4 'gt3r' 'gt1l' ... 'gt1l' 'gt3r'\n",
+       "Attributes:\n",
+       "    data_product:  ATL06\n",
+       "    Description:   The land_ice_height group contains the primary set of deri...\n",
+       "    data_rate:     Data within this group are sparse.  Data values are provid...
" + ], + "text/plain": [ + "\n", + "Dimensions: (photon_idx: 29027, spot: 2, gran_idx: 6)\n", + "Coordinates:\n", + " * photon_idx (photon_idx) int64 0 1 2 3 ... 29023 29024 29025 29026\n", + " * spot (spot) uint8 2 5\n", + " * gran_idx (gran_idx) float64 8.49e+04 9.02e+04 ... 1.016e+05\n", + " source_file (gran_idx) " + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], "source": [ "ds.plot.scatter(x=\"longitude\", y=\"latitude\", hue=\"h_li\", vmin=-100, vmax=2000)" ] @@ -101,7 +727,9 @@ { "cell_type": "markdown", "id": "b8875936", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "---------------------------------------\n", "## Key steps for loading (reading) ICESat-2 data\n", @@ -119,7 +747,9 @@ { "cell_type": "markdown", "id": "9bf6d38c", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "### Step 0: Get some data if you haven't already\n", "Here are a few lines of code to get you set up with a few data files if you don't already have some on your local system." @@ -127,7 +757,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 9, "id": "63da2b3c", "metadata": {}, "outputs": [], @@ -138,10 +768,24 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 10, "id": "e6f7c047", "metadata": {}, - "outputs": [], + "outputs": [ + { + "ename": "AttributeError", + "evalue": "'Query' object has no attribute '_session'", + "output_type": "error", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mAttributeError\u001b[0m Traceback (most recent call last)", + "Cell \u001b[0;32mIn[10], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m \u001b[43mregion_a\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdownload_granules\u001b[49m\u001b[43m(\u001b[49m\u001b[43mpath\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mpath_root\u001b[49m\u001b[43m)\u001b[49m\n", + "File \u001b[0;32m~/envs/general/lib/python3.11/site-packages/icepyx/core/query.py:1129\u001b[0m, in \u001b[0;36mQuery.download_granules\u001b[0;34m(self, path, verbose, subset, restart, **kwargs)\u001b[0m\n\u001b[1;32m 1124\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 1125\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m 
(\n\u001b[1;32m 1126\u001b[0m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28mhasattr\u001b[39m(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_granules, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124morderIDs\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 1127\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mlen\u001b[39m(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_granules\u001b[38;5;241m.\u001b[39morderIDs) \u001b[38;5;241m==\u001b[39m \u001b[38;5;241m0\u001b[39m\n\u001b[1;32m 1128\u001b[0m ):\n\u001b[0;32m-> 1129\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43morder_granules\u001b[49m\u001b[43m(\u001b[49m\u001b[43mverbose\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mverbose\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43msubset\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43msubset\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1131\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_granules\u001b[38;5;241m.\u001b[39mdownload(verbose, path, session\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_session, restart\u001b[38;5;241m=\u001b[39mrestart)\n", + "File \u001b[0;32m~/envs/general/lib/python3.11/site-packages/icepyx/core/query.py:1065\u001b[0m, in \u001b[0;36mQuery.order_granules\u001b[0;34m(self, verbose, subset, email, **kwargs)\u001b[0m\n\u001b[1;32m 1048\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_granules\u001b[38;5;241m.\u001b[39mplace_order(\n\u001b[1;32m 1049\u001b[0m tempCMRparams,\n\u001b[1;32m 1050\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mreqparams,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 1055\u001b[0m 
geom_filepath\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_spatial\u001b[38;5;241m.\u001b[39m_geom_file,\n\u001b[1;32m 1056\u001b[0m )\n\u001b[1;32m 1058\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 1059\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_granules\u001b[38;5;241m.\u001b[39mplace_order(\n\u001b[1;32m 1060\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mCMRparams,\n\u001b[1;32m 1061\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mreqparams,\n\u001b[1;32m 1062\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39msubsetparams(\u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs),\n\u001b[1;32m 1063\u001b[0m verbose,\n\u001b[1;32m 1064\u001b[0m subset,\n\u001b[0;32m-> 1065\u001b[0m session\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_session\u001b[49m,\n\u001b[1;32m 1066\u001b[0m geom_filepath\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_spatial\u001b[38;5;241m.\u001b[39m_geom_file,\n\u001b[1;32m 1067\u001b[0m )\n", + "\u001b[0;31mAttributeError\u001b[0m: 'Query' object has no attribute '_session'" + ] + } + ], "source": [ "region_a.download_granules(path=path_root)" ] @@ -182,7 +826,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 11, "id": "9cde6679", "metadata": {}, "outputs": [], @@ -192,7 +836,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 13, "id": "8b6edf0c", "metadata": {}, "outputs": [], @@ -202,7 +846,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 14, "id": "e683ebf7", "metadata": {}, "outputs": [], @@ -213,7 +857,9 @@ { "cell_type": "markdown", "id": "92743496", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "### Step 2: Create a filename pattern for your data files\n", "\n", @@ -227,7 +873,7 @@ }, { 
"cell_type": "code", - "execution_count": null, + "execution_count": 15, "id": "7318abd0", "metadata": {}, "outputs": [], @@ -238,7 +884,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 16, "id": "f43e8664", "metadata": {}, "outputs": [], @@ -248,7 +894,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 17, "id": "992a77fb", "metadata": {}, "outputs": [], @@ -258,7 +904,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 18, "id": "6aec1a70", "metadata": {}, "outputs": [], @@ -269,7 +915,9 @@ { "cell_type": "markdown", "id": "4275b04c", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "### Step 3: Create an icepyx read object\n", "\n", @@ -277,29 +925,52 @@ "- `path` = a string with the full file path or full directory path to your hdf5 (.h5) format files.\n", "- `product` = the data product you're working with, also known as the \"short name\".\n", "\n", - "The `Read` object also accepts two optional keyword inputs:\n", - "- `pattern` = a formatted string indicating the filename pattern required for Intake's path_as_pattern argument.\n", - "- `catalog` = a string with the full path to an Intake catalog, for users who wish to use their own catalog (note this may have unintended consequenses if multiple granules are being combined)." + "The `Read` object also accepts the optional keyword input:\n", + "- `pattern` = a formatted string indicating the filename pattern required for Intake's path_as_pattern argument." 
] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 19, "id": "39bd7eb8", "metadata": { "scrolled": true }, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "You have 6 files matching the filename pattern to be read in.\n" + ] + } + ], "source": [ "reader = ipx.Read(data_source=path_root, product=\"ATL06\", filename_pattern=pattern) # or ipx.Read(filepath, \"ATLXX\") if your filenames match the default pattern" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 20, "id": "6c9ebc4a", "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "['../../../../data/ATL06/processed_ATL06_20190226005526_09100205_006_02.h5',\n", + " '../../../../data/ATL06/processed_ATL06_20191201105502_10010505_006_01.h5',\n", + " '../../../../data/ATL06/processed_ATL06_20190225121032_09020203_006_02.h5',\n", + " '../../../../data/ATL06/processed_ATL06_20190222010344_08490205_006_02.h5',\n", + " '../../../../data/ATL06/processed_ATL06_20191130112041_09860505_006_01.h5',\n", + " '../../../../data/ATL06/processed_ATL06_20191202102922_10160505_006_01.h5']" + ] + }, + "execution_count": 20, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "reader._filelist" ] @@ -307,7 +978,9 @@ { "cell_type": "markdown", "id": "da8d8024", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "### Step 4: Specify variables to be read in\n", "\n", @@ -320,12 +993,616 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 21, "id": "18f65f67", "metadata": { "scrolled": true }, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "['ancillary_data/atlas_sdp_gps_epoch',\n", + " 'ancillary_data/control',\n", + " 'ancillary_data/data_end_utc',\n", + " 'ancillary_data/data_start_utc',\n", + " 'ancillary_data/end_cycle',\n", + " 'ancillary_data/end_delta_time',\n", + " 'ancillary_data/end_geoseg',\n", + " 
'ancillary_data/end_gpssow',\n", + " 'ancillary_data/end_gpsweek',\n", + " 'ancillary_data/end_orbit',\n", + " 'ancillary_data/end_region',\n", + " 'ancillary_data/end_rgt',\n", + " 'ancillary_data/granule_end_utc',\n", + " 'ancillary_data/granule_start_utc',\n", + " 'ancillary_data/land_ice/dt_hist',\n", + " 'ancillary_data/land_ice/fit_maxiter',\n", + " 'ancillary_data/land_ice/fpb_maxiter',\n", + " 'ancillary_data/land_ice/max_res_ids',\n", + " 'ancillary_data/land_ice/min_dist',\n", + " 'ancillary_data/land_ice/min_gain_th',\n", + " 'ancillary_data/land_ice/min_n_pe',\n", + " 'ancillary_data/land_ice/min_n_sel',\n", + " 'ancillary_data/land_ice/min_signal_conf',\n", + " 'ancillary_data/land_ice/n_hist',\n", + " 'ancillary_data/land_ice/n_sigmas',\n", + " 'ancillary_data/land_ice/nhist_bins',\n", + " 'ancillary_data/land_ice/proc_interval',\n", + " 'ancillary_data/land_ice/qs_lim_bsc',\n", + " 'ancillary_data/land_ice/qs_lim_hrs',\n", + " 'ancillary_data/land_ice/qs_lim_hsigma',\n", + " 'ancillary_data/land_ice/qs_lim_msw',\n", + " 'ancillary_data/land_ice/qs_lim_snr',\n", + " 'ancillary_data/land_ice/qs_lim_sss',\n", + " 'ancillary_data/land_ice/rbin_width',\n", + " 'ancillary_data/land_ice/sigma_beam',\n", + " 'ancillary_data/land_ice/sigma_tx',\n", + " 'ancillary_data/land_ice/t_dead',\n", + " 'ancillary_data/land_ice/txp_maxiter',\n", + " 'ancillary_data/qa_at_interval',\n", + " 'ancillary_data/release',\n", + " 'ancillary_data/start_cycle',\n", + " 'ancillary_data/start_delta_time',\n", + " 'ancillary_data/start_geoseg',\n", + " 'ancillary_data/start_gpssow',\n", + " 'ancillary_data/start_gpsweek',\n", + " 'ancillary_data/start_orbit',\n", + " 'ancillary_data/start_region',\n", + " 'ancillary_data/start_rgt',\n", + " 'ancillary_data/version',\n", + " 'gt1l/land_ice_segments/atl06_quality_summary',\n", + " 'gt1l/land_ice_segments/bias_correction/fpb_mean_corr',\n", + " 'gt1l/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", + " 
'gt1l/land_ice_segments/bias_correction/fpb_med_corr',\n", + " 'gt1l/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", + " 'gt1l/land_ice_segments/bias_correction/fpb_n_corr',\n", + " 'gt1l/land_ice_segments/bias_correction/med_r_fit',\n", + " 'gt1l/land_ice_segments/bias_correction/tx_mean_corr',\n", + " 'gt1l/land_ice_segments/bias_correction/tx_med_corr',\n", + " 'gt1l/land_ice_segments/delta_time',\n", + " 'gt1l/land_ice_segments/dem/dem_flag',\n", + " 'gt1l/land_ice_segments/dem/dem_h',\n", + " 'gt1l/land_ice_segments/dem/geoid_free2mean',\n", + " 'gt1l/land_ice_segments/dem/geoid_h',\n", + " 'gt1l/land_ice_segments/fit_statistics/dh_fit_dx',\n", + " 'gt1l/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", + " 'gt1l/land_ice_segments/fit_statistics/dh_fit_dy',\n", + " 'gt1l/land_ice_segments/fit_statistics/h_expected_rms',\n", + " 'gt1l/land_ice_segments/fit_statistics/h_mean',\n", + " 'gt1l/land_ice_segments/fit_statistics/h_rms_misfit',\n", + " 'gt1l/land_ice_segments/fit_statistics/h_robust_sprd',\n", + " 'gt1l/land_ice_segments/fit_statistics/n_fit_photons',\n", + " 'gt1l/land_ice_segments/fit_statistics/n_seg_pulses',\n", + " 'gt1l/land_ice_segments/fit_statistics/sigma_h_mean',\n", + " 'gt1l/land_ice_segments/fit_statistics/signal_selection_source',\n", + " 'gt1l/land_ice_segments/fit_statistics/signal_selection_source_status',\n", + " 'gt1l/land_ice_segments/fit_statistics/snr',\n", + " 'gt1l/land_ice_segments/fit_statistics/snr_significance',\n", + " 'gt1l/land_ice_segments/fit_statistics/w_surface_window_final',\n", + " 'gt1l/land_ice_segments/geophysical/bckgrd',\n", + " 'gt1l/land_ice_segments/geophysical/bsnow_conf',\n", + " 'gt1l/land_ice_segments/geophysical/bsnow_h',\n", + " 'gt1l/land_ice_segments/geophysical/bsnow_od',\n", + " 'gt1l/land_ice_segments/geophysical/cloud_flg_asr',\n", + " 'gt1l/land_ice_segments/geophysical/cloud_flg_atm',\n", + " 'gt1l/land_ice_segments/geophysical/dac',\n", + " 
'gt1l/land_ice_segments/geophysical/e_bckgrd',\n", + " 'gt1l/land_ice_segments/geophysical/layer_flag',\n", + " 'gt1l/land_ice_segments/geophysical/msw_flag',\n", + " 'gt1l/land_ice_segments/geophysical/neutat_delay_total',\n", + " 'gt1l/land_ice_segments/geophysical/r_eff',\n", + " 'gt1l/land_ice_segments/geophysical/solar_azimuth',\n", + " 'gt1l/land_ice_segments/geophysical/solar_elevation',\n", + " 'gt1l/land_ice_segments/geophysical/tide_earth',\n", + " 'gt1l/land_ice_segments/geophysical/tide_earth_free2mean',\n", + " 'gt1l/land_ice_segments/geophysical/tide_equilibrium',\n", + " 'gt1l/land_ice_segments/geophysical/tide_load',\n", + " 'gt1l/land_ice_segments/geophysical/tide_ocean',\n", + " 'gt1l/land_ice_segments/geophysical/tide_pole',\n", + " 'gt1l/land_ice_segments/ground_track/ref_azimuth',\n", + " 'gt1l/land_ice_segments/ground_track/ref_coelv',\n", + " 'gt1l/land_ice_segments/ground_track/seg_azimuth',\n", + " 'gt1l/land_ice_segments/ground_track/sigma_geo_at',\n", + " 'gt1l/land_ice_segments/ground_track/sigma_geo_r',\n", + " 'gt1l/land_ice_segments/ground_track/sigma_geo_xt',\n", + " 'gt1l/land_ice_segments/ground_track/x_atc',\n", + " 'gt1l/land_ice_segments/ground_track/y_atc',\n", + " 'gt1l/land_ice_segments/h_li',\n", + " 'gt1l/land_ice_segments/h_li_sigma',\n", + " 'gt1l/land_ice_segments/latitude',\n", + " 'gt1l/land_ice_segments/longitude',\n", + " 'gt1l/land_ice_segments/segment_id',\n", + " 'gt1l/land_ice_segments/sigma_geo_h',\n", + " 'gt1l/residual_histogram/bckgrd_per_m',\n", + " 'gt1l/residual_histogram/bin_top_h',\n", + " 'gt1l/residual_histogram/count',\n", + " 'gt1l/residual_histogram/delta_time',\n", + " 'gt1l/residual_histogram/ds_segment_id',\n", + " 'gt1l/residual_histogram/lat_mean',\n", + " 'gt1l/residual_histogram/lon_mean',\n", + " 'gt1l/residual_histogram/pulse_count',\n", + " 'gt1l/residual_histogram/segment_id_list',\n", + " 'gt1l/residual_histogram/x_atc_mean',\n", + " 'gt1l/segment_quality/delta_time',\n", + " 
'gt1l/segment_quality/record_number',\n", + " 'gt1l/segment_quality/reference_pt_lat',\n", + " 'gt1l/segment_quality/reference_pt_lon',\n", + " 'gt1l/segment_quality/segment_id',\n", + " 'gt1l/segment_quality/signal_selection_source',\n", + " 'gt1l/segment_quality/signal_selection_status/signal_selection_status_all',\n", + " 'gt1l/segment_quality/signal_selection_status/signal_selection_status_backup',\n", + " 'gt1l/segment_quality/signal_selection_status/signal_selection_status_confident',\n", + " 'gt1r/land_ice_segments/atl06_quality_summary',\n", + " 'gt1r/land_ice_segments/bias_correction/fpb_mean_corr',\n", + " 'gt1r/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", + " 'gt1r/land_ice_segments/bias_correction/fpb_med_corr',\n", + " 'gt1r/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", + " 'gt1r/land_ice_segments/bias_correction/fpb_n_corr',\n", + " 'gt1r/land_ice_segments/bias_correction/med_r_fit',\n", + " 'gt1r/land_ice_segments/bias_correction/tx_mean_corr',\n", + " 'gt1r/land_ice_segments/bias_correction/tx_med_corr',\n", + " 'gt1r/land_ice_segments/delta_time',\n", + " 'gt1r/land_ice_segments/dem/dem_flag',\n", + " 'gt1r/land_ice_segments/dem/dem_h',\n", + " 'gt1r/land_ice_segments/dem/geoid_free2mean',\n", + " 'gt1r/land_ice_segments/dem/geoid_h',\n", + " 'gt1r/land_ice_segments/fit_statistics/dh_fit_dx',\n", + " 'gt1r/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", + " 'gt1r/land_ice_segments/fit_statistics/dh_fit_dy',\n", + " 'gt1r/land_ice_segments/fit_statistics/h_expected_rms',\n", + " 'gt1r/land_ice_segments/fit_statistics/h_mean',\n", + " 'gt1r/land_ice_segments/fit_statistics/h_rms_misfit',\n", + " 'gt1r/land_ice_segments/fit_statistics/h_robust_sprd',\n", + " 'gt1r/land_ice_segments/fit_statistics/n_fit_photons',\n", + " 'gt1r/land_ice_segments/fit_statistics/n_seg_pulses',\n", + " 'gt1r/land_ice_segments/fit_statistics/sigma_h_mean',\n", + " 'gt1r/land_ice_segments/fit_statistics/signal_selection_source',\n", + " 
'gt1r/land_ice_segments/fit_statistics/signal_selection_source_status',\n", + " 'gt1r/land_ice_segments/fit_statistics/snr',\n", + " 'gt1r/land_ice_segments/fit_statistics/snr_significance',\n", + " 'gt1r/land_ice_segments/fit_statistics/w_surface_window_final',\n", + " 'gt1r/land_ice_segments/geophysical/bckgrd',\n", + " 'gt1r/land_ice_segments/geophysical/bsnow_conf',\n", + " 'gt1r/land_ice_segments/geophysical/bsnow_h',\n", + " 'gt1r/land_ice_segments/geophysical/bsnow_od',\n", + " 'gt1r/land_ice_segments/geophysical/cloud_flg_asr',\n", + " 'gt1r/land_ice_segments/geophysical/cloud_flg_atm',\n", + " 'gt1r/land_ice_segments/geophysical/dac',\n", + " 'gt1r/land_ice_segments/geophysical/e_bckgrd',\n", + " 'gt1r/land_ice_segments/geophysical/layer_flag',\n", + " 'gt1r/land_ice_segments/geophysical/msw_flag',\n", + " 'gt1r/land_ice_segments/geophysical/neutat_delay_total',\n", + " 'gt1r/land_ice_segments/geophysical/r_eff',\n", + " 'gt1r/land_ice_segments/geophysical/solar_azimuth',\n", + " 'gt1r/land_ice_segments/geophysical/solar_elevation',\n", + " 'gt1r/land_ice_segments/geophysical/tide_earth',\n", + " 'gt1r/land_ice_segments/geophysical/tide_earth_free2mean',\n", + " 'gt1r/land_ice_segments/geophysical/tide_equilibrium',\n", + " 'gt1r/land_ice_segments/geophysical/tide_load',\n", + " 'gt1r/land_ice_segments/geophysical/tide_ocean',\n", + " 'gt1r/land_ice_segments/geophysical/tide_pole',\n", + " 'gt1r/land_ice_segments/ground_track/ref_azimuth',\n", + " 'gt1r/land_ice_segments/ground_track/ref_coelv',\n", + " 'gt1r/land_ice_segments/ground_track/seg_azimuth',\n", + " 'gt1r/land_ice_segments/ground_track/sigma_geo_at',\n", + " 'gt1r/land_ice_segments/ground_track/sigma_geo_r',\n", + " 'gt1r/land_ice_segments/ground_track/sigma_geo_xt',\n", + " 'gt1r/land_ice_segments/ground_track/x_atc',\n", + " 'gt1r/land_ice_segments/ground_track/y_atc',\n", + " 'gt1r/land_ice_segments/h_li',\n", + " 'gt1r/land_ice_segments/h_li_sigma',\n", + " 
'gt1r/land_ice_segments/latitude',\n", + " 'gt1r/land_ice_segments/longitude',\n", + " 'gt1r/land_ice_segments/segment_id',\n", + " 'gt1r/land_ice_segments/sigma_geo_h',\n", + " 'gt1r/residual_histogram/bckgrd_per_m',\n", + " 'gt1r/residual_histogram/bin_top_h',\n", + " 'gt1r/residual_histogram/count',\n", + " 'gt1r/residual_histogram/delta_time',\n", + " 'gt1r/residual_histogram/ds_segment_id',\n", + " 'gt1r/residual_histogram/lat_mean',\n", + " 'gt1r/residual_histogram/lon_mean',\n", + " 'gt1r/residual_histogram/pulse_count',\n", + " 'gt1r/residual_histogram/segment_id_list',\n", + " 'gt1r/residual_histogram/x_atc_mean',\n", + " 'gt1r/segment_quality/delta_time',\n", + " 'gt1r/segment_quality/record_number',\n", + " 'gt1r/segment_quality/reference_pt_lat',\n", + " 'gt1r/segment_quality/reference_pt_lon',\n", + " 'gt1r/segment_quality/segment_id',\n", + " 'gt1r/segment_quality/signal_selection_source',\n", + " 'gt1r/segment_quality/signal_selection_status/signal_selection_status_all',\n", + " 'gt1r/segment_quality/signal_selection_status/signal_selection_status_backup',\n", + " 'gt1r/segment_quality/signal_selection_status/signal_selection_status_confident',\n", + " 'gt2l/land_ice_segments/atl06_quality_summary',\n", + " 'gt2l/land_ice_segments/bias_correction/fpb_mean_corr',\n", + " 'gt2l/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", + " 'gt2l/land_ice_segments/bias_correction/fpb_med_corr',\n", + " 'gt2l/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", + " 'gt2l/land_ice_segments/bias_correction/fpb_n_corr',\n", + " 'gt2l/land_ice_segments/bias_correction/med_r_fit',\n", + " 'gt2l/land_ice_segments/bias_correction/tx_mean_corr',\n", + " 'gt2l/land_ice_segments/bias_correction/tx_med_corr',\n", + " 'gt2l/land_ice_segments/delta_time',\n", + " 'gt2l/land_ice_segments/dem/dem_flag',\n", + " 'gt2l/land_ice_segments/dem/dem_h',\n", + " 'gt2l/land_ice_segments/dem/geoid_free2mean',\n", + " 'gt2l/land_ice_segments/dem/geoid_h',\n", + " 
'gt2l/land_ice_segments/fit_statistics/dh_fit_dx',\n", + " 'gt2l/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", + " 'gt2l/land_ice_segments/fit_statistics/dh_fit_dy',\n", + " 'gt2l/land_ice_segments/fit_statistics/h_expected_rms',\n", + " 'gt2l/land_ice_segments/fit_statistics/h_mean',\n", + " 'gt2l/land_ice_segments/fit_statistics/h_rms_misfit',\n", + " 'gt2l/land_ice_segments/fit_statistics/h_robust_sprd',\n", + " 'gt2l/land_ice_segments/fit_statistics/n_fit_photons',\n", + " 'gt2l/land_ice_segments/fit_statistics/n_seg_pulses',\n", + " 'gt2l/land_ice_segments/fit_statistics/sigma_h_mean',\n", + " 'gt2l/land_ice_segments/fit_statistics/signal_selection_source',\n", + " 'gt2l/land_ice_segments/fit_statistics/signal_selection_source_status',\n", + " 'gt2l/land_ice_segments/fit_statistics/snr',\n", + " 'gt2l/land_ice_segments/fit_statistics/snr_significance',\n", + " 'gt2l/land_ice_segments/fit_statistics/w_surface_window_final',\n", + " 'gt2l/land_ice_segments/geophysical/bckgrd',\n", + " 'gt2l/land_ice_segments/geophysical/bsnow_conf',\n", + " 'gt2l/land_ice_segments/geophysical/bsnow_h',\n", + " 'gt2l/land_ice_segments/geophysical/bsnow_od',\n", + " 'gt2l/land_ice_segments/geophysical/cloud_flg_asr',\n", + " 'gt2l/land_ice_segments/geophysical/cloud_flg_atm',\n", + " 'gt2l/land_ice_segments/geophysical/dac',\n", + " 'gt2l/land_ice_segments/geophysical/e_bckgrd',\n", + " 'gt2l/land_ice_segments/geophysical/layer_flag',\n", + " 'gt2l/land_ice_segments/geophysical/msw_flag',\n", + " 'gt2l/land_ice_segments/geophysical/neutat_delay_total',\n", + " 'gt2l/land_ice_segments/geophysical/r_eff',\n", + " 'gt2l/land_ice_segments/geophysical/solar_azimuth',\n", + " 'gt2l/land_ice_segments/geophysical/solar_elevation',\n", + " 'gt2l/land_ice_segments/geophysical/tide_earth',\n", + " 'gt2l/land_ice_segments/geophysical/tide_earth_free2mean',\n", + " 'gt2l/land_ice_segments/geophysical/tide_equilibrium',\n", + " 'gt2l/land_ice_segments/geophysical/tide_load',\n", + " 
'gt2l/land_ice_segments/geophysical/tide_ocean',\n", + " 'gt2l/land_ice_segments/geophysical/tide_pole',\n", + " 'gt2l/land_ice_segments/ground_track/ref_azimuth',\n", + " 'gt2l/land_ice_segments/ground_track/ref_coelv',\n", + " 'gt2l/land_ice_segments/ground_track/seg_azimuth',\n", + " 'gt2l/land_ice_segments/ground_track/sigma_geo_at',\n", + " 'gt2l/land_ice_segments/ground_track/sigma_geo_r',\n", + " 'gt2l/land_ice_segments/ground_track/sigma_geo_xt',\n", + " 'gt2l/land_ice_segments/ground_track/x_atc',\n", + " 'gt2l/land_ice_segments/ground_track/y_atc',\n", + " 'gt2l/land_ice_segments/h_li',\n", + " 'gt2l/land_ice_segments/h_li_sigma',\n", + " 'gt2l/land_ice_segments/latitude',\n", + " 'gt2l/land_ice_segments/longitude',\n", + " 'gt2l/land_ice_segments/segment_id',\n", + " 'gt2l/land_ice_segments/sigma_geo_h',\n", + " 'gt2l/residual_histogram/bckgrd_per_m',\n", + " 'gt2l/residual_histogram/bin_top_h',\n", + " 'gt2l/residual_histogram/count',\n", + " 'gt2l/residual_histogram/delta_time',\n", + " 'gt2l/residual_histogram/ds_segment_id',\n", + " 'gt2l/residual_histogram/lat_mean',\n", + " 'gt2l/residual_histogram/lon_mean',\n", + " 'gt2l/residual_histogram/pulse_count',\n", + " 'gt2l/residual_histogram/segment_id_list',\n", + " 'gt2l/residual_histogram/x_atc_mean',\n", + " 'gt2l/segment_quality/delta_time',\n", + " 'gt2l/segment_quality/record_number',\n", + " 'gt2l/segment_quality/reference_pt_lat',\n", + " 'gt2l/segment_quality/reference_pt_lon',\n", + " 'gt2l/segment_quality/segment_id',\n", + " 'gt2l/segment_quality/signal_selection_source',\n", + " 'gt2l/segment_quality/signal_selection_status/signal_selection_status_all',\n", + " 'gt2l/segment_quality/signal_selection_status/signal_selection_status_backup',\n", + " 'gt2l/segment_quality/signal_selection_status/signal_selection_status_confident',\n", + " 'gt2r/land_ice_segments/atl06_quality_summary',\n", + " 'gt2r/land_ice_segments/bias_correction/fpb_mean_corr',\n", + " 
'gt2r/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", + " 'gt2r/land_ice_segments/bias_correction/fpb_med_corr',\n", + " 'gt2r/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", + " 'gt2r/land_ice_segments/bias_correction/fpb_n_corr',\n", + " 'gt2r/land_ice_segments/bias_correction/med_r_fit',\n", + " 'gt2r/land_ice_segments/bias_correction/tx_mean_corr',\n", + " 'gt2r/land_ice_segments/bias_correction/tx_med_corr',\n", + " 'gt2r/land_ice_segments/delta_time',\n", + " 'gt2r/land_ice_segments/dem/dem_flag',\n", + " 'gt2r/land_ice_segments/dem/dem_h',\n", + " 'gt2r/land_ice_segments/dem/geoid_free2mean',\n", + " 'gt2r/land_ice_segments/dem/geoid_h',\n", + " 'gt2r/land_ice_segments/fit_statistics/dh_fit_dx',\n", + " 'gt2r/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", + " 'gt2r/land_ice_segments/fit_statistics/dh_fit_dy',\n", + " 'gt2r/land_ice_segments/fit_statistics/h_expected_rms',\n", + " 'gt2r/land_ice_segments/fit_statistics/h_mean',\n", + " 'gt2r/land_ice_segments/fit_statistics/h_rms_misfit',\n", + " 'gt2r/land_ice_segments/fit_statistics/h_robust_sprd',\n", + " 'gt2r/land_ice_segments/fit_statistics/n_fit_photons',\n", + " 'gt2r/land_ice_segments/fit_statistics/n_seg_pulses',\n", + " 'gt2r/land_ice_segments/fit_statistics/sigma_h_mean',\n", + " 'gt2r/land_ice_segments/fit_statistics/signal_selection_source',\n", + " 'gt2r/land_ice_segments/fit_statistics/signal_selection_source_status',\n", + " 'gt2r/land_ice_segments/fit_statistics/snr',\n", + " 'gt2r/land_ice_segments/fit_statistics/snr_significance',\n", + " 'gt2r/land_ice_segments/fit_statistics/w_surface_window_final',\n", + " 'gt2r/land_ice_segments/geophysical/bckgrd',\n", + " 'gt2r/land_ice_segments/geophysical/bsnow_conf',\n", + " 'gt2r/land_ice_segments/geophysical/bsnow_h',\n", + " 'gt2r/land_ice_segments/geophysical/bsnow_od',\n", + " 'gt2r/land_ice_segments/geophysical/cloud_flg_asr',\n", + " 'gt2r/land_ice_segments/geophysical/cloud_flg_atm',\n", + " 
'gt2r/land_ice_segments/geophysical/dac',\n", + " 'gt2r/land_ice_segments/geophysical/e_bckgrd',\n", + " 'gt2r/land_ice_segments/geophysical/layer_flag',\n", + " 'gt2r/land_ice_segments/geophysical/msw_flag',\n", + " 'gt2r/land_ice_segments/geophysical/neutat_delay_total',\n", + " 'gt2r/land_ice_segments/geophysical/r_eff',\n", + " 'gt2r/land_ice_segments/geophysical/solar_azimuth',\n", + " 'gt2r/land_ice_segments/geophysical/solar_elevation',\n", + " 'gt2r/land_ice_segments/geophysical/tide_earth',\n", + " 'gt2r/land_ice_segments/geophysical/tide_earth_free2mean',\n", + " 'gt2r/land_ice_segments/geophysical/tide_equilibrium',\n", + " 'gt2r/land_ice_segments/geophysical/tide_load',\n", + " 'gt2r/land_ice_segments/geophysical/tide_ocean',\n", + " 'gt2r/land_ice_segments/geophysical/tide_pole',\n", + " 'gt2r/land_ice_segments/ground_track/ref_azimuth',\n", + " 'gt2r/land_ice_segments/ground_track/ref_coelv',\n", + " 'gt2r/land_ice_segments/ground_track/seg_azimuth',\n", + " 'gt2r/land_ice_segments/ground_track/sigma_geo_at',\n", + " 'gt2r/land_ice_segments/ground_track/sigma_geo_r',\n", + " 'gt2r/land_ice_segments/ground_track/sigma_geo_xt',\n", + " 'gt2r/land_ice_segments/ground_track/x_atc',\n", + " 'gt2r/land_ice_segments/ground_track/y_atc',\n", + " 'gt2r/land_ice_segments/h_li',\n", + " 'gt2r/land_ice_segments/h_li_sigma',\n", + " 'gt2r/land_ice_segments/latitude',\n", + " 'gt2r/land_ice_segments/longitude',\n", + " 'gt2r/land_ice_segments/segment_id',\n", + " 'gt2r/land_ice_segments/sigma_geo_h',\n", + " 'gt2r/residual_histogram/bckgrd_per_m',\n", + " 'gt2r/residual_histogram/bin_top_h',\n", + " 'gt2r/residual_histogram/count',\n", + " 'gt2r/residual_histogram/delta_time',\n", + " 'gt2r/residual_histogram/ds_segment_id',\n", + " 'gt2r/residual_histogram/lat_mean',\n", + " 'gt2r/residual_histogram/lon_mean',\n", + " 'gt2r/residual_histogram/pulse_count',\n", + " 'gt2r/residual_histogram/segment_id_list',\n", + " 'gt2r/residual_histogram/x_atc_mean',\n", + " 
'gt2r/segment_quality/delta_time',\n", + " 'gt2r/segment_quality/record_number',\n", + " 'gt2r/segment_quality/reference_pt_lat',\n", + " 'gt2r/segment_quality/reference_pt_lon',\n", + " 'gt2r/segment_quality/segment_id',\n", + " 'gt2r/segment_quality/signal_selection_source',\n", + " 'gt2r/segment_quality/signal_selection_status/signal_selection_status_all',\n", + " 'gt2r/segment_quality/signal_selection_status/signal_selection_status_backup',\n", + " 'gt2r/segment_quality/signal_selection_status/signal_selection_status_confident',\n", + " 'gt3l/land_ice_segments/atl06_quality_summary',\n", + " 'gt3l/land_ice_segments/bias_correction/fpb_mean_corr',\n", + " 'gt3l/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", + " 'gt3l/land_ice_segments/bias_correction/fpb_med_corr',\n", + " 'gt3l/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", + " 'gt3l/land_ice_segments/bias_correction/fpb_n_corr',\n", + " 'gt3l/land_ice_segments/bias_correction/med_r_fit',\n", + " 'gt3l/land_ice_segments/bias_correction/tx_mean_corr',\n", + " 'gt3l/land_ice_segments/bias_correction/tx_med_corr',\n", + " 'gt3l/land_ice_segments/delta_time',\n", + " 'gt3l/land_ice_segments/dem/dem_flag',\n", + " 'gt3l/land_ice_segments/dem/dem_h',\n", + " 'gt3l/land_ice_segments/dem/geoid_free2mean',\n", + " 'gt3l/land_ice_segments/dem/geoid_h',\n", + " 'gt3l/land_ice_segments/fit_statistics/dh_fit_dx',\n", + " 'gt3l/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", + " 'gt3l/land_ice_segments/fit_statistics/dh_fit_dy',\n", + " 'gt3l/land_ice_segments/fit_statistics/h_expected_rms',\n", + " 'gt3l/land_ice_segments/fit_statistics/h_mean',\n", + " 'gt3l/land_ice_segments/fit_statistics/h_rms_misfit',\n", + " 'gt3l/land_ice_segments/fit_statistics/h_robust_sprd',\n", + " 'gt3l/land_ice_segments/fit_statistics/n_fit_photons',\n", + " 'gt3l/land_ice_segments/fit_statistics/n_seg_pulses',\n", + " 'gt3l/land_ice_segments/fit_statistics/sigma_h_mean',\n", + " 
'gt3l/land_ice_segments/fit_statistics/signal_selection_source',\n", + " 'gt3l/land_ice_segments/fit_statistics/signal_selection_source_status',\n", + " 'gt3l/land_ice_segments/fit_statistics/snr',\n", + " 'gt3l/land_ice_segments/fit_statistics/snr_significance',\n", + " 'gt3l/land_ice_segments/fit_statistics/w_surface_window_final',\n", + " 'gt3l/land_ice_segments/geophysical/bckgrd',\n", + " 'gt3l/land_ice_segments/geophysical/bsnow_conf',\n", + " 'gt3l/land_ice_segments/geophysical/bsnow_h',\n", + " 'gt3l/land_ice_segments/geophysical/bsnow_od',\n", + " 'gt3l/land_ice_segments/geophysical/cloud_flg_asr',\n", + " 'gt3l/land_ice_segments/geophysical/cloud_flg_atm',\n", + " 'gt3l/land_ice_segments/geophysical/dac',\n", + " 'gt3l/land_ice_segments/geophysical/e_bckgrd',\n", + " 'gt3l/land_ice_segments/geophysical/layer_flag',\n", + " 'gt3l/land_ice_segments/geophysical/msw_flag',\n", + " 'gt3l/land_ice_segments/geophysical/neutat_delay_total',\n", + " 'gt3l/land_ice_segments/geophysical/r_eff',\n", + " 'gt3l/land_ice_segments/geophysical/solar_azimuth',\n", + " 'gt3l/land_ice_segments/geophysical/solar_elevation',\n", + " 'gt3l/land_ice_segments/geophysical/tide_earth',\n", + " 'gt3l/land_ice_segments/geophysical/tide_earth_free2mean',\n", + " 'gt3l/land_ice_segments/geophysical/tide_equilibrium',\n", + " 'gt3l/land_ice_segments/geophysical/tide_load',\n", + " 'gt3l/land_ice_segments/geophysical/tide_ocean',\n", + " 'gt3l/land_ice_segments/geophysical/tide_pole',\n", + " 'gt3l/land_ice_segments/ground_track/ref_azimuth',\n", + " 'gt3l/land_ice_segments/ground_track/ref_coelv',\n", + " 'gt3l/land_ice_segments/ground_track/seg_azimuth',\n", + " 'gt3l/land_ice_segments/ground_track/sigma_geo_at',\n", + " 'gt3l/land_ice_segments/ground_track/sigma_geo_r',\n", + " 'gt3l/land_ice_segments/ground_track/sigma_geo_xt',\n", + " 'gt3l/land_ice_segments/ground_track/x_atc',\n", + " 'gt3l/land_ice_segments/ground_track/y_atc',\n", + " 'gt3l/land_ice_segments/h_li',\n", + " 
'gt3l/land_ice_segments/h_li_sigma',\n", + " 'gt3l/land_ice_segments/latitude',\n", + " 'gt3l/land_ice_segments/longitude',\n", + " 'gt3l/land_ice_segments/segment_id',\n", + " 'gt3l/land_ice_segments/sigma_geo_h',\n", + " 'gt3l/residual_histogram/bckgrd_per_m',\n", + " 'gt3l/residual_histogram/bin_top_h',\n", + " 'gt3l/residual_histogram/count',\n", + " 'gt3l/residual_histogram/delta_time',\n", + " 'gt3l/residual_histogram/ds_segment_id',\n", + " 'gt3l/residual_histogram/lat_mean',\n", + " 'gt3l/residual_histogram/lon_mean',\n", + " 'gt3l/residual_histogram/pulse_count',\n", + " 'gt3l/residual_histogram/segment_id_list',\n", + " 'gt3l/residual_histogram/x_atc_mean',\n", + " 'gt3l/segment_quality/delta_time',\n", + " 'gt3l/segment_quality/record_number',\n", + " 'gt3l/segment_quality/reference_pt_lat',\n", + " 'gt3l/segment_quality/reference_pt_lon',\n", + " 'gt3l/segment_quality/segment_id',\n", + " 'gt3l/segment_quality/signal_selection_source',\n", + " 'gt3l/segment_quality/signal_selection_status/signal_selection_status_all',\n", + " 'gt3l/segment_quality/signal_selection_status/signal_selection_status_backup',\n", + " 'gt3l/segment_quality/signal_selection_status/signal_selection_status_confident',\n", + " 'gt3r/land_ice_segments/atl06_quality_summary',\n", + " 'gt3r/land_ice_segments/bias_correction/fpb_mean_corr',\n", + " 'gt3r/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", + " 'gt3r/land_ice_segments/bias_correction/fpb_med_corr',\n", + " 'gt3r/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", + " 'gt3r/land_ice_segments/bias_correction/fpb_n_corr',\n", + " 'gt3r/land_ice_segments/bias_correction/med_r_fit',\n", + " 'gt3r/land_ice_segments/bias_correction/tx_mean_corr',\n", + " 'gt3r/land_ice_segments/bias_correction/tx_med_corr',\n", + " 'gt3r/land_ice_segments/delta_time',\n", + " 'gt3r/land_ice_segments/dem/dem_flag',\n", + " 'gt3r/land_ice_segments/dem/dem_h',\n", + " 'gt3r/land_ice_segments/dem/geoid_free2mean',\n", + " 
'gt3r/land_ice_segments/dem/geoid_h',\n", + " 'gt3r/land_ice_segments/fit_statistics/dh_fit_dx',\n", + " 'gt3r/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", + " 'gt3r/land_ice_segments/fit_statistics/dh_fit_dy',\n", + " 'gt3r/land_ice_segments/fit_statistics/h_expected_rms',\n", + " 'gt3r/land_ice_segments/fit_statistics/h_mean',\n", + " 'gt3r/land_ice_segments/fit_statistics/h_rms_misfit',\n", + " 'gt3r/land_ice_segments/fit_statistics/h_robust_sprd',\n", + " 'gt3r/land_ice_segments/fit_statistics/n_fit_photons',\n", + " 'gt3r/land_ice_segments/fit_statistics/n_seg_pulses',\n", + " 'gt3r/land_ice_segments/fit_statistics/sigma_h_mean',\n", + " 'gt3r/land_ice_segments/fit_statistics/signal_selection_source',\n", + " 'gt3r/land_ice_segments/fit_statistics/signal_selection_source_status',\n", + " 'gt3r/land_ice_segments/fit_statistics/snr',\n", + " 'gt3r/land_ice_segments/fit_statistics/snr_significance',\n", + " 'gt3r/land_ice_segments/fit_statistics/w_surface_window_final',\n", + " 'gt3r/land_ice_segments/geophysical/bckgrd',\n", + " 'gt3r/land_ice_segments/geophysical/bsnow_conf',\n", + " 'gt3r/land_ice_segments/geophysical/bsnow_h',\n", + " 'gt3r/land_ice_segments/geophysical/bsnow_od',\n", + " 'gt3r/land_ice_segments/geophysical/cloud_flg_asr',\n", + " 'gt3r/land_ice_segments/geophysical/cloud_flg_atm',\n", + " 'gt3r/land_ice_segments/geophysical/dac',\n", + " 'gt3r/land_ice_segments/geophysical/e_bckgrd',\n", + " 'gt3r/land_ice_segments/geophysical/layer_flag',\n", + " 'gt3r/land_ice_segments/geophysical/msw_flag',\n", + " 'gt3r/land_ice_segments/geophysical/neutat_delay_total',\n", + " 'gt3r/land_ice_segments/geophysical/r_eff',\n", + " 'gt3r/land_ice_segments/geophysical/solar_azimuth',\n", + " 'gt3r/land_ice_segments/geophysical/solar_elevation',\n", + " 'gt3r/land_ice_segments/geophysical/tide_earth',\n", + " 'gt3r/land_ice_segments/geophysical/tide_earth_free2mean',\n", + " 'gt3r/land_ice_segments/geophysical/tide_equilibrium',\n", + " 
'gt3r/land_ice_segments/geophysical/tide_load',\n", + " 'gt3r/land_ice_segments/geophysical/tide_ocean',\n", + " 'gt3r/land_ice_segments/geophysical/tide_pole',\n", + " 'gt3r/land_ice_segments/ground_track/ref_azimuth',\n", + " 'gt3r/land_ice_segments/ground_track/ref_coelv',\n", + " 'gt3r/land_ice_segments/ground_track/seg_azimuth',\n", + " 'gt3r/land_ice_segments/ground_track/sigma_geo_at',\n", + " 'gt3r/land_ice_segments/ground_track/sigma_geo_r',\n", + " 'gt3r/land_ice_segments/ground_track/sigma_geo_xt',\n", + " 'gt3r/land_ice_segments/ground_track/x_atc',\n", + " 'gt3r/land_ice_segments/ground_track/y_atc',\n", + " 'gt3r/land_ice_segments/h_li',\n", + " 'gt3r/land_ice_segments/h_li_sigma',\n", + " 'gt3r/land_ice_segments/latitude',\n", + " 'gt3r/land_ice_segments/longitude',\n", + " 'gt3r/land_ice_segments/segment_id',\n", + " 'gt3r/land_ice_segments/sigma_geo_h',\n", + " 'gt3r/residual_histogram/bckgrd_per_m',\n", + " 'gt3r/residual_histogram/bin_top_h',\n", + " 'gt3r/residual_histogram/count',\n", + " 'gt3r/residual_histogram/delta_time',\n", + " 'gt3r/residual_histogram/ds_segment_id',\n", + " 'gt3r/residual_histogram/lat_mean',\n", + " 'gt3r/residual_histogram/lon_mean',\n", + " 'gt3r/residual_histogram/pulse_count',\n", + " 'gt3r/residual_histogram/segment_id_list',\n", + " 'gt3r/residual_histogram/x_atc_mean',\n", + " 'gt3r/segment_quality/delta_time',\n", + " 'gt3r/segment_quality/record_number',\n", + " 'gt3r/segment_quality/reference_pt_lat',\n", + " 'gt3r/segment_quality/reference_pt_lon',\n", + " 'gt3r/segment_quality/segment_id',\n", + " 'gt3r/segment_quality/signal_selection_source',\n", + " 'gt3r/segment_quality/signal_selection_status/signal_selection_status_all',\n", + " 'gt3r/segment_quality/signal_selection_status/signal_selection_status_backup',\n", + " 'gt3r/segment_quality/signal_selection_status/signal_selection_status_confident',\n", + " 'orbit_info/bounding_polygon_lat1',\n", + " 'orbit_info/bounding_polygon_lon1',\n", + " 
'orbit_info/crossing_time',\n", + " 'orbit_info/cycle_number',\n", + " 'orbit_info/lan',\n", + " 'orbit_info/orbit_number',\n", + " 'orbit_info/rgt',\n", + " 'orbit_info/sc_orient',\n", + " 'orbit_info/sc_orient_time',\n", + " 'quality_assessment/gt1l/delta_time',\n", + " 'quality_assessment/gt1l/lat_mean',\n", + " 'quality_assessment/gt1l/lon_mean',\n", + " 'quality_assessment/gt1l/signal_selection_source_fraction_0',\n", + " 'quality_assessment/gt1l/signal_selection_source_fraction_1',\n", + " 'quality_assessment/gt1l/signal_selection_source_fraction_2',\n", + " 'quality_assessment/gt1l/signal_selection_source_fraction_3',\n", + " 'quality_assessment/gt1r/delta_time',\n", + " 'quality_assessment/gt1r/lat_mean',\n", + " 'quality_assessment/gt1r/lon_mean',\n", + " 'quality_assessment/gt1r/signal_selection_source_fraction_0',\n", + " 'quality_assessment/gt1r/signal_selection_source_fraction_1',\n", + " 'quality_assessment/gt1r/signal_selection_source_fraction_2',\n", + " 'quality_assessment/gt1r/signal_selection_source_fraction_3',\n", + " 'quality_assessment/gt2l/delta_time',\n", + " 'quality_assessment/gt2l/lat_mean',\n", + " 'quality_assessment/gt2l/lon_mean',\n", + " 'quality_assessment/gt2l/signal_selection_source_fraction_0',\n", + " 'quality_assessment/gt2l/signal_selection_source_fraction_1',\n", + " 'quality_assessment/gt2l/signal_selection_source_fraction_2',\n", + " 'quality_assessment/gt2l/signal_selection_source_fraction_3',\n", + " 'quality_assessment/gt2r/delta_time',\n", + " 'quality_assessment/gt2r/lat_mean',\n", + " 'quality_assessment/gt2r/lon_mean',\n", + " 'quality_assessment/gt2r/signal_selection_source_fraction_0',\n", + " 'quality_assessment/gt2r/signal_selection_source_fraction_1',\n", + " 'quality_assessment/gt2r/signal_selection_source_fraction_2',\n", + " 'quality_assessment/gt2r/signal_selection_source_fraction_3',\n", + " 'quality_assessment/gt3l/delta_time',\n", + " 'quality_assessment/gt3l/lat_mean',\n", + " 
'quality_assessment/gt3l/lon_mean',\n", + " 'quality_assessment/gt3l/signal_selection_source_fraction_0',\n", + " 'quality_assessment/gt3l/signal_selection_source_fraction_1',\n", + " 'quality_assessment/gt3l/signal_selection_source_fraction_2',\n", + " 'quality_assessment/gt3l/signal_selection_source_fraction_3',\n", + " 'quality_assessment/gt3r/delta_time',\n", + " 'quality_assessment/gt3r/lat_mean',\n", + " 'quality_assessment/gt3r/lon_mean',\n", + " 'quality_assessment/gt3r/signal_selection_source_fraction_0',\n", + " 'quality_assessment/gt3r/signal_selection_source_fraction_1',\n", + " 'quality_assessment/gt3r/signal_selection_source_fraction_2',\n", + " 'quality_assessment/gt3r/signal_selection_source_fraction_3',\n", + " 'quality_assessment/qa_granule_fail_reason',\n", + " 'quality_assessment/qa_granule_pass_fail']" + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "reader.vars.avail()" ] @@ -333,7 +1610,9 @@ { "cell_type": "markdown", "id": "b2449941", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "To make things easier, you can use icepyx's built-in default list that loads commonly used variables for your non-gridded data product, or create your own list of variables to be read in.\n", "icepyx will determine what variables are available for you to read in by creating a list from one of your source files.\n", @@ -349,7 +1628,9 @@ { "cell_type": "markdown", "id": "55092d1b", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "For a basic case, let's say we want to read in height, latitude, and longitude for all beam pairs.\n", "We create our variables list as" @@ -357,7 +1638,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 28, "id": "e3734e09", "metadata": {}, "outputs": [], @@ -368,17 +1649,53 @@ { "cell_type": "markdown", "id": "fff0bb19", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ 
"Then we can view a dictionary of the variables we'd like to read in." ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 29, "id": "e5456e36", "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "{'sc_orient': ['orbit_info/sc_orient'],\n", + " 'atlas_sdp_gps_epoch': ['ancillary_data/atlas_sdp_gps_epoch'],\n", + " 'cycle_number': ['orbit_info/cycle_number'],\n", + " 'rgt': ['orbit_info/rgt'],\n", + " 'data_start_utc': ['ancillary_data/data_start_utc'],\n", + " 'data_end_utc': ['ancillary_data/data_end_utc'],\n", + " 'h_li': ['gt1l/land_ice_segments/h_li',\n", + " 'gt1r/land_ice_segments/h_li',\n", + " 'gt2l/land_ice_segments/h_li',\n", + " 'gt2r/land_ice_segments/h_li',\n", + " 'gt3l/land_ice_segments/h_li',\n", + " 'gt3r/land_ice_segments/h_li'],\n", + " 'latitude': ['gt1l/land_ice_segments/latitude',\n", + " 'gt1r/land_ice_segments/latitude',\n", + " 'gt2l/land_ice_segments/latitude',\n", + " 'gt2r/land_ice_segments/latitude',\n", + " 'gt3l/land_ice_segments/latitude',\n", + " 'gt3r/land_ice_segments/latitude'],\n", + " 'longitude': ['gt1l/land_ice_segments/longitude',\n", + " 'gt1r/land_ice_segments/longitude',\n", + " 'gt2l/land_ice_segments/longitude',\n", + " 'gt2r/land_ice_segments/longitude',\n", + " 'gt3l/land_ice_segments/longitude',\n", + " 'gt3r/land_ice_segments/longitude']}" + ] + }, + "execution_count": 29, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "reader.vars.wanted" ] @@ -386,14 +1703,16 @@ { "cell_type": "markdown", "id": "9d5b50b5", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "Don't forget - if you need to start over, and re-generate your wanted variables list, it's easy!" 
] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 24, "id": "69894391", "metadata": {}, "outputs": [], @@ -404,7 +1723,9 @@ { "cell_type": "markdown", "id": "473de4d7", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "### Step 5: Loading your data\n", "\n", @@ -414,9 +1735,120 @@ { "cell_type": "code", "execution_count": null, - "id": "eaabc976", + "id": "4a66d889-8d2d-4b9a-821a-96a394ff8d66", "metadata": {}, "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 30, + "id": "eaabc976", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. 
This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. 
This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. 
This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", + " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n", + "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", + " .rename({\"delta_time\": \"photon_idx\"})\n" + ] + } + ], "source": [ "ds = reader.load()" ] @@ -424,7 +1856,9 @@ { "cell_type": "markdown", "id": "db6560f1", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "Within a Jupyter Notebook, you can get a summary view of your data object.\n", "\n", @@ -435,10 +1869,549 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 26, "id": "723256f7", "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
<xarray.Dataset>\n",
+       "Dimensions:              (photon_idx: 29027, spot: 2, gran_idx: 6)\n",
+       "Coordinates:\n",
+       "  * photon_idx           (photon_idx) int64 0 1 2 3 ... 29023 29024 29025 29026\n",
+       "  * spot                 (spot) uint8 2 5\n",
+       "  * gran_idx             (gran_idx) float64 8.49e+04 9.02e+04 ... 1.016e+05\n",
+       "    source_file          (gran_idx) <U72 '../../../../data/ATL06/processed_AT...\n",
+       "    delta_time           (gran_idx, photon_idx) datetime64[ns] 2019-02-22T01:...\n",
+       "Data variables:\n",
+       "    sc_orient            (gran_idx) int8 0 0 0 1 1 1\n",
+       "    cycle_number         (gran_idx) int8 2 2 2 5 5 5\n",
+       "    rgt                  (gran_idx) int16 849 902 910 986 1001 1016\n",
+       "    atlas_sdp_gps_epoch  (gran_idx) datetime64[ns] 2018-01-01T00:00:18 ... 20...\n",
+       "    data_start_utc       (gran_idx) datetime64[ns] 2019-02-22T01:03:44.199777...\n",
+       "    data_end_utc         (gran_idx) datetime64[ns] 2019-02-22T01:07:38.112326...\n",
+       "    h_li                 (spot, gran_idx, photon_idx) float32 nan nan ... nan\n",
+       "    latitude             (spot, gran_idx, photon_idx) float64 nan nan ... nan\n",
+       "    longitude            (spot, gran_idx, photon_idx) float64 nan nan ... nan\n",
+       "    gt                   (gran_idx, spot) <U4 'gt3r' 'gt1l' ... 'gt1l' 'gt3r'\n",
+       "Attributes:\n",
+       "    data_product:  ATL06\n",
+       "    Description:   The land_ice_height group contains the primary set of deri...\n",
+       "    data_rate:     Data within this group are sparse.  Data values are provid...
" + ], + "text/plain": [ + "\n", + "Dimensions: (photon_idx: 29027, spot: 2, gran_idx: 6)\n", + "Coordinates:\n", + " * photon_idx (photon_idx) int64 0 1 2 3 ... 29023 29024 29025 29026\n", + " * spot (spot) uint8 2 5\n", + " * gran_idx (gran_idx) float64 8.49e+04 9.02e+04 ... 1.016e+05\n", + " source_file (gran_idx) " + ] + }, + "execution_count": 27, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "ds.plot.scatter(x=\"longitude\", y=\"latitude\", hue=\"h_li\", vmin=-100, vmax=2000)" ] @@ -469,7 +2455,9 @@ { "cell_type": "markdown", "id": "6421f67c", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "A developer note to users:\n", "our next steps will be to create an xarray extension with ICESat-2 aware functions (like \"get_strong_beams\", etc.).\n", @@ -478,191 +2466,39 @@ }, { "cell_type": "markdown", - "id": "6edfbb25", - "metadata": {}, - "source": [ - "### More on Intake catalogs and the read object\n", - "\n", - "As anyone familiar with ICESat-2 hdf5 files knows, one of the challenges to reading in data is looping through all of the beam pairs for each track.\n", - "The icepyx read module takes advantage of icepyx's variables module, which has some awareness of ICESat-2 data and uses that to save the user the trouble of having to loop through each beam pair.\n", - "The `reader.load()` function does this by automatically creating minimal Intake catalogs for each variable path, reading in the data, and merging each variable into a ready-to-analyze Xarray DataSet.\n", - "The Intake savvy user may wish to view the template catalog or use an existing catalog." 
- ] - }, - { - "cell_type": "markdown", - "id": "0f0076f9", - "metadata": {}, - "source": [ - "#### Viewing the template catalog\n", - "\n", - "You can access the ICESat-2 catalog template as an attribute of the read object.\n", - "\n", - "***NOTE: accessing `reader.is2catalog` creates a template with a placeholder in the 'group' parameter; thus, it will not work to actually read in data***" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "2de29fd8", + "id": "1b0cb477", "metadata": { - "scrolled": true + "user_expressions": [] }, - "outputs": [], - "source": [ - "reader.is2catalog" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "7a5deef8", - "metadata": {}, - "outputs": [], - "source": [ - "reader.is2catalog.gui" - ] - }, - { - "cell_type": "markdown", - "id": "fef43556", - "metadata": {}, - "source": [ - "#### Use an existing catalog\n", - "If you already have a catalog for your data, you can supply that when you create the read object." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "64986a60", - "metadata": {}, - "outputs": [], - "source": [ - "catpath = path_root + 'test_catalog.yml'\n", - "reader = ipx.Read(filepath, pattern, catpath)" - ] - }, - { - "cell_type": "markdown", - "id": "cf930e0a", - "metadata": {}, - "source": [ - "Then, you can use the catalog you supplied by calling intake's `read` directly to read in the specified data variable." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "dd0e086a", - "metadata": {}, - "outputs": [], - "source": [ - "ds = reader.is2catalog.read()" - ] - }, - { - "cell_type": "markdown", - "id": "60b1a304", - "metadata": {}, "source": [ - "***NOTE: this means that you will only be able to read in a single data variable!***\n", - "\n", - "To take advantage of icepyx's knowledge of ICESat-2 data nesting of beam pairs and read in multiple related variables at once, you must use the variable approach outlined earlier in this tutorial." + "#### Credits\n", + "* original notebook by: Jessica Scheick\n", + "* notebook contributors: Wei Ji and Tian\n", + "* templates for default ICESat-2 Intake catalogs from: [Wei Ji](https://github.com/icesat2py/icepyx/issues/106) and [Tian](https://github.com/icetianli/ICESat2_xarray)." ] }, { "cell_type": "code", "execution_count": null, - "id": "f5e3a221", - "metadata": {}, - "outputs": [], - "source": [ - "ds = reader.load()\n", - "ds" - ] - }, - { - "cell_type": "markdown", - "id": "d56fc41c", + "id": "aaf6f5a6-355b-456a-99fd-ce0b51045b58", "metadata": {}, - "source": [ - "### More customization options\n", - "\n", - "If you'd like to use the icepyx ICESat-2 Catalog template to create your own customized catalog, we recommend that you access the `build_catalog` function directly, which returns an Intake Catalog instance.\n", - "\n", - "You'll need to supply the required `data_source`, `path_pattern`, and `source_type` arguments. `data_source` and `path_pattern` are described in Steps 2 and 3 of this tutorial. 
`source_type` is the string you'd like to use for your Local Catalog entry.\n", - "\n", - "This function accepts as keyword input arguments (kwargs) dictionaries with appropriate keys (depending on the Intake driver you are using).\n", - "The simplest version of this is specifying the variable parameters and paths of interest.\n", - "`grp_paths` may contain \"variables\", each of which must then be further defined by `grp_path_params`.\n", - "You cannot use glob-like path syntax to access variables (so `grp_path = '/*/land_ice_segments'` is NOT VALID)." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "f174f885", - "metadata": { - "scrolled": true - }, "outputs": [], - "source": [ - "import icepyx.core.is2cat as is2cat\n", - "\n", - "# build a custom ICESat-2 catalog with a group and parameter\n", - "cat = is2cat.build_catalog(data_source = path_root,\n", - " path_pattern = pattern,\n", - " source_type = \"manual_catalog\",\n", - " grp_paths = \"/{{gt}}/land_ice_segments\",\n", - " grp_path_params = [{\"name\": \"gt\",\n", - " \"description\": \"Ground track\",\n", - " \"type\": \"str\",\n", - " \"default\": \"gt1l\",\n", - " \"allowed\": [\"gt1l\", \"gt1r\", \"gt2l\", \"gt2r\", \"gt3l\", \"gt3r\"]\n", - " }]\n", - " )" - ] - }, - { - "cell_type": "markdown", - "id": "bab9c949", - "metadata": {}, - "source": [ - "#### Saving your catalog\n", - "If you create a highly customized ICESat-2 catalog, you can use Intake's `save` to export it as a .yml file.\n", - "\n", - "Don't forget you can easily use an existing catalog (such as this highly customized one you just made) to read in your data with `reader = ipx.Read(filepath, pattern, catalog)` (so it's as easy as re-creating your reader object with your modified catalog)." 
- ] + "source": [] }, { "cell_type": "code", "execution_count": null, - "id": "30f0122a", + "id": "8ea1987f-b6bf-44df-a869-949290f498cb", "metadata": {}, "outputs": [], - "source": [ - "catpath = path_root + 'test_catalog.yml'\n", - "cat.save(catpath)" - ] - }, - { - "cell_type": "markdown", - "id": "1b0cb477", - "metadata": {}, - "source": [ - "#### Credits\n", - "* original notebook by: Jessica Scheick\n", - "* notebook contributors: Wei Ji and Tian\n", - "* templates for default ICESat-2 Intake catalogs from: [Wei Ji](https://github.com/icesat2py/icepyx/issues/106) and [Tian](https://github.com/icetianli/ICESat2_xarray)." - ] + "source": [] } ], "metadata": { "kernelspec": { - "display_name": "Python 3 (ipykernel)", + "display_name": "general", "language": "python", - "name": "python3" + "name": "general" }, "language_info": { "codemirror_mode": { @@ -674,7 +2510,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.10.12" + "version": "3.11.4" } }, "nbformat": 4, diff --git a/doc/source/user_guide/documentation/read.rst b/doc/source/user_guide/documentation/read.rst index b076ef210..a5beedf4e 100644 --- a/doc/source/user_guide/documentation/read.rst +++ b/doc/source/user_guide/documentation/read.rst @@ -19,7 +19,6 @@ Attributes .. 
autosummary:: :toctree: ../../_icepyx/ - Read.is2catalog Read.vars From 9f066112c8b73200128e18eed8e6242d15329da6 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Wed, 30 Aug 2023 20:52:51 +0000 Subject: [PATCH 07/30] update approach paragraph --- doc/source/example_notebooks/IS2_data_read-in.ipynb | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/doc/source/example_notebooks/IS2_data_read-in.ipynb b/doc/source/example_notebooks/IS2_data_read-in.ipynb index b8697b1d7..c459b7c78 100644 --- a/doc/source/example_notebooks/IS2_data_read-in.ipynb +++ b/doc/source/example_notebooks/IS2_data_read-in.ipynb @@ -22,10 +22,7 @@ "Instead of needing to manually iterate through the beam pairs, you can provide a few options to the `Read` object and icepyx will do the heavy lifting for you (as detailed in this notebook).\n", "\n", "### Approach\n", - "If you're interested in what's happening under the hood: icepyx turns your instructions into something called a catalog, then uses the Intake library and the catalog to actually load the data into memory. Specifically, icepyx creates an [Intake](https://intake.readthedocs.io/en/latest/) data [catalog](https://intake.readthedocs.io/en/latest/catalog.html) for each requested variable and then merges the read-in data from each of the variables to create a single data object.\n", - "\n", - "Intake catalogs are powerful (and the tool we selected) because they can be saved, shared, modified, and reused to reproducibly read in a set of data files in a consistent way as part of an analysis workflow.\n", - "This approach streamlines the transition between data sources (local/downloaded files or, ultimately, cloud/bucket access) and data object types (e.g. [Xarray Dataset](http://xarray.pydata.org/en/stable/generated/xarray.Dataset.html) or [GeoPandas GeoDataFrame](https://geopandas.org/docs/reference/api/geopandas.GeoDataFrame.html))." 
+ "If you're interested in what's happening under the hood: icepyx uses the [xarray](https://docs.xarray.dev/en/stable/) library to read in each of the requested variables of the dataset. icepyx formats each requested variable and then merges the read-in data from each of the variables to create a single data object. The use of xarray is powerful, because the returned data object can be used with relevant xarray processing tools." ] }, { From d019b9a2db2391882dbc69c4816f64eb03f389e3 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Wed, 30 Aug 2023 20:59:03 +0000 Subject: [PATCH 08/30] remove one more instance of catalog from the docs --- doc/source/example_notebooks/IS2_data_read-in.ipynb | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/doc/source/example_notebooks/IS2_data_read-in.ipynb b/doc/source/example_notebooks/IS2_data_read-in.ipynb index c459b7c78..13b49cddb 100644 --- a/doc/source/example_notebooks/IS2_data_read-in.ipynb +++ b/doc/source/example_notebooks/IS2_data_read-in.ipynb @@ -2470,8 +2470,7 @@ "source": [ "#### Credits\n", "* original notebook by: Jessica Scheick\n", - "* notebook contributors: Wei Ji and Tian\n", - "* templates for default ICESat-2 Intake catalogs from: [Wei Ji](https://github.com/icesat2py/icepyx/issues/106) and [Tian](https://github.com/icetianli/ICESat2_xarray)." 
+ "* notebook contributors: Wei Ji and Tian" ] }, { From 156ea89103f44dd4b7be680ac51eecb5e1b85b18 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Wed, 30 Aug 2023 21:01:36 +0000 Subject: [PATCH 09/30] clear jupyter history --- .../example_notebooks/IS2_data_read-in.ipynb | 2019 +---------------- 1 file changed, 34 insertions(+), 1985 deletions(-) diff --git a/doc/source/example_notebooks/IS2_data_read-in.ipynb b/doc/source/example_notebooks/IS2_data_read-in.ipynb index 13b49cddb..115c63044 100644 --- a/doc/source/example_notebooks/IS2_data_read-in.ipynb +++ b/doc/source/example_notebooks/IS2_data_read-in.ipynb @@ -35,7 +35,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": null, "id": "2b74b672", "metadata": {}, "outputs": [], @@ -58,18 +58,10 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": null, "id": "c4390195", "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "You have 6 files matching the filename pattern to be read in.\n" - ] - } - ], + "outputs": [], "source": [ "path_root = '/full/path/to/your/data/'\n", "pattern = \"processed_ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5\"\n", @@ -78,7 +70,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": null, "id": "2f46029d", "metadata": {}, "outputs": [], @@ -88,603 +80,10 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": null, "id": "c0439388", "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. 
This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n" - ] - }, - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "
<xarray.Dataset>\n",
-       "Dimensions:              (photon_idx: 29027, spot: 2, gran_idx: 6)\n",
-       "Coordinates:\n",
-       "  * photon_idx           (photon_idx) int64 0 1 2 3 ... 29023 29024 29025 29026\n",
-       "  * spot                 (spot) uint8 2 5\n",
-       "  * gran_idx             (gran_idx) float64 8.49e+04 9.02e+04 ... 1.016e+05\n",
-       "    source_file          (gran_idx) <U72 '../../../../data/ATL06/processed_AT...\n",
-       "    delta_time           (gran_idx, photon_idx) datetime64[ns] 2019-02-22T01:...\n",
-       "Data variables:\n",
-       "    sc_orient            (gran_idx) int8 0 0 0 1 1 1\n",
-       "    cycle_number         (gran_idx) int8 2 2 2 5 5 5\n",
-       "    rgt                  (gran_idx) int16 849 902 910 986 1001 1016\n",
-       "    atlas_sdp_gps_epoch  (gran_idx) datetime64[ns] 2018-01-01T00:00:18 ... 20...\n",
-       "    data_start_utc       (gran_idx) datetime64[ns] 2019-02-22T01:03:44.199777...\n",
-       "    data_end_utc         (gran_idx) datetime64[ns] 2019-02-22T01:07:38.112326...\n",
-       "    h_li                 (spot, gran_idx, photon_idx) float32 nan nan ... nan\n",
-       "    latitude             (spot, gran_idx, photon_idx) float64 nan nan ... nan\n",
-       "    longitude            (spot, gran_idx, photon_idx) float64 nan nan ... nan\n",
-       "    gt                   (gran_idx, spot) <U4 'gt3r' 'gt1l' ... 'gt1l' 'gt3r'\n",
-       "Attributes:\n",
-       "    data_product:  ATL06\n",
-       "    Description:   The land_ice_height group contains the primary set of deri...\n",
-       "    data_rate:     Data within this group are sparse.  Data values are provid...
" - ], - "text/plain": [ - "\n", - "Dimensions: (photon_idx: 29027, spot: 2, gran_idx: 6)\n", - "Coordinates:\n", - " * photon_idx (photon_idx) int64 0 1 2 3 ... 29023 29024 29025 29026\n", - " * spot (spot) uint8 2 5\n", - " * gran_idx (gran_idx) float64 8.49e+04 9.02e+04 ... 1.016e+05\n", - " source_file (gran_idx) " - ] - }, - "execution_count": 8, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "ds.plot.scatter(x=\"longitude\", y=\"latitude\", hue=\"h_li\", vmin=-100, vmax=2000)" ] @@ -754,7 +132,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": null, "id": "63da2b3c", "metadata": {}, "outputs": [], @@ -765,24 +143,10 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": null, "id": "e6f7c047", "metadata": {}, - "outputs": [ - { - "ename": "AttributeError", - "evalue": "'Query' object has no attribute '_session'", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mAttributeError\u001b[0m Traceback (most recent call last)", - "Cell \u001b[0;32mIn[10], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m \u001b[43mregion_a\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdownload_granules\u001b[49m\u001b[43m(\u001b[49m\u001b[43mpath\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mpath_root\u001b[49m\u001b[43m)\u001b[49m\n", - "File \u001b[0;32m~/envs/general/lib/python3.11/site-packages/icepyx/core/query.py:1129\u001b[0m, in \u001b[0;36mQuery.download_granules\u001b[0;34m(self, path, verbose, subset, restart, **kwargs)\u001b[0m\n\u001b[1;32m 1124\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 1125\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m (\n\u001b[1;32m 1126\u001b[0m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28mhasattr\u001b[39m(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_granules, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124morderIDs\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 1127\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mlen\u001b[39m(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_granules\u001b[38;5;241m.\u001b[39morderIDs) \u001b[38;5;241m==\u001b[39m \u001b[38;5;241m0\u001b[39m\n\u001b[1;32m 1128\u001b[0m ):\n\u001b[0;32m-> 
1129\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43morder_granules\u001b[49m\u001b[43m(\u001b[49m\u001b[43mverbose\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mverbose\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43msubset\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43msubset\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1131\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_granules\u001b[38;5;241m.\u001b[39mdownload(verbose, path, session\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_session, restart\u001b[38;5;241m=\u001b[39mrestart)\n", - "File \u001b[0;32m~/envs/general/lib/python3.11/site-packages/icepyx/core/query.py:1065\u001b[0m, in \u001b[0;36mQuery.order_granules\u001b[0;34m(self, verbose, subset, email, **kwargs)\u001b[0m\n\u001b[1;32m 1048\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_granules\u001b[38;5;241m.\u001b[39mplace_order(\n\u001b[1;32m 1049\u001b[0m tempCMRparams,\n\u001b[1;32m 1050\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mreqparams,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 1055\u001b[0m geom_filepath\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_spatial\u001b[38;5;241m.\u001b[39m_geom_file,\n\u001b[1;32m 1056\u001b[0m )\n\u001b[1;32m 1058\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 1059\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_granules\u001b[38;5;241m.\u001b[39mplace_order(\n\u001b[1;32m 1060\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mCMRparams,\n\u001b[1;32m 1061\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mreqparams,\n\u001b[1;32m 1062\u001b[0m 
\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39msubsetparams(\u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs),\n\u001b[1;32m 1063\u001b[0m verbose,\n\u001b[1;32m 1064\u001b[0m subset,\n\u001b[0;32m-> 1065\u001b[0m session\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_session\u001b[49m,\n\u001b[1;32m 1066\u001b[0m geom_filepath\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_spatial\u001b[38;5;241m.\u001b[39m_geom_file,\n\u001b[1;32m 1067\u001b[0m )\n", - "\u001b[0;31mAttributeError\u001b[0m: 'Query' object has no attribute '_session'" - ] - } - ], + "outputs": [], "source": [ "region_a.download_granules(path=path_root)" ] @@ -823,7 +187,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": null, "id": "9cde6679", "metadata": {}, "outputs": [], @@ -833,7 +197,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": null, "id": "8b6edf0c", "metadata": {}, "outputs": [], @@ -843,7 +207,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": null, "id": "e683ebf7", "metadata": {}, "outputs": [], @@ -870,7 +234,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": null, "id": "7318abd0", "metadata": {}, "outputs": [], @@ -881,7 +245,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": null, "id": "f43e8664", "metadata": {}, "outputs": [], @@ -891,7 +255,7 @@ }, { "cell_type": "code", - "execution_count": 17, + "execution_count": null, "id": "992a77fb", "metadata": {}, "outputs": [], @@ -901,7 +265,7 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": null, "id": "6aec1a70", "metadata": {}, "outputs": [], @@ -928,46 +292,22 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": null, "id": "39bd7eb8", "metadata": { "scrolled": true }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - 
"text": [ - "You have 6 files matching the filename pattern to be read in.\n" - ] - } - ], + "outputs": [], "source": [ "reader = ipx.Read(data_source=path_root, product=\"ATL06\", filename_pattern=pattern) # or ipx.Read(filepath, \"ATLXX\") if your filenames match the default pattern" ] }, { "cell_type": "code", - "execution_count": 20, + "execution_count": null, "id": "6c9ebc4a", "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "['../../../../data/ATL06/processed_ATL06_20190226005526_09100205_006_02.h5',\n", - " '../../../../data/ATL06/processed_ATL06_20191201105502_10010505_006_01.h5',\n", - " '../../../../data/ATL06/processed_ATL06_20190225121032_09020203_006_02.h5',\n", - " '../../../../data/ATL06/processed_ATL06_20190222010344_08490205_006_02.h5',\n", - " '../../../../data/ATL06/processed_ATL06_20191130112041_09860505_006_01.h5',\n", - " '../../../../data/ATL06/processed_ATL06_20191202102922_10160505_006_01.h5']" - ] - }, - "execution_count": 20, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "reader._filelist" ] @@ -990,616 +330,12 @@ }, { "cell_type": "code", - "execution_count": 21, + "execution_count": null, "id": "18f65f67", "metadata": { "scrolled": true }, - "outputs": [ - { - "data": { - "text/plain": [ - "['ancillary_data/atlas_sdp_gps_epoch',\n", - " 'ancillary_data/control',\n", - " 'ancillary_data/data_end_utc',\n", - " 'ancillary_data/data_start_utc',\n", - " 'ancillary_data/end_cycle',\n", - " 'ancillary_data/end_delta_time',\n", - " 'ancillary_data/end_geoseg',\n", - " 'ancillary_data/end_gpssow',\n", - " 'ancillary_data/end_gpsweek',\n", - " 'ancillary_data/end_orbit',\n", - " 'ancillary_data/end_region',\n", - " 'ancillary_data/end_rgt',\n", - " 'ancillary_data/granule_end_utc',\n", - " 'ancillary_data/granule_start_utc',\n", - " 'ancillary_data/land_ice/dt_hist',\n", - " 'ancillary_data/land_ice/fit_maxiter',\n", - " 'ancillary_data/land_ice/fpb_maxiter',\n", - " 
'ancillary_data/land_ice/max_res_ids',\n", - " 'ancillary_data/land_ice/min_dist',\n", - " 'ancillary_data/land_ice/min_gain_th',\n", - " 'ancillary_data/land_ice/min_n_pe',\n", - " 'ancillary_data/land_ice/min_n_sel',\n", - " 'ancillary_data/land_ice/min_signal_conf',\n", - " 'ancillary_data/land_ice/n_hist',\n", - " 'ancillary_data/land_ice/n_sigmas',\n", - " 'ancillary_data/land_ice/nhist_bins',\n", - " 'ancillary_data/land_ice/proc_interval',\n", - " 'ancillary_data/land_ice/qs_lim_bsc',\n", - " 'ancillary_data/land_ice/qs_lim_hrs',\n", - " 'ancillary_data/land_ice/qs_lim_hsigma',\n", - " 'ancillary_data/land_ice/qs_lim_msw',\n", - " 'ancillary_data/land_ice/qs_lim_snr',\n", - " 'ancillary_data/land_ice/qs_lim_sss',\n", - " 'ancillary_data/land_ice/rbin_width',\n", - " 'ancillary_data/land_ice/sigma_beam',\n", - " 'ancillary_data/land_ice/sigma_tx',\n", - " 'ancillary_data/land_ice/t_dead',\n", - " 'ancillary_data/land_ice/txp_maxiter',\n", - " 'ancillary_data/qa_at_interval',\n", - " 'ancillary_data/release',\n", - " 'ancillary_data/start_cycle',\n", - " 'ancillary_data/start_delta_time',\n", - " 'ancillary_data/start_geoseg',\n", - " 'ancillary_data/start_gpssow',\n", - " 'ancillary_data/start_gpsweek',\n", - " 'ancillary_data/start_orbit',\n", - " 'ancillary_data/start_region',\n", - " 'ancillary_data/start_rgt',\n", - " 'ancillary_data/version',\n", - " 'gt1l/land_ice_segments/atl06_quality_summary',\n", - " 'gt1l/land_ice_segments/bias_correction/fpb_mean_corr',\n", - " 'gt1l/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", - " 'gt1l/land_ice_segments/bias_correction/fpb_med_corr',\n", - " 'gt1l/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", - " 'gt1l/land_ice_segments/bias_correction/fpb_n_corr',\n", - " 'gt1l/land_ice_segments/bias_correction/med_r_fit',\n", - " 'gt1l/land_ice_segments/bias_correction/tx_mean_corr',\n", - " 'gt1l/land_ice_segments/bias_correction/tx_med_corr',\n", - " 'gt1l/land_ice_segments/delta_time',\n", - " 
'gt1l/land_ice_segments/dem/dem_flag',\n", - " 'gt1l/land_ice_segments/dem/dem_h',\n", - " 'gt1l/land_ice_segments/dem/geoid_free2mean',\n", - " 'gt1l/land_ice_segments/dem/geoid_h',\n", - " 'gt1l/land_ice_segments/fit_statistics/dh_fit_dx',\n", - " 'gt1l/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", - " 'gt1l/land_ice_segments/fit_statistics/dh_fit_dy',\n", - " 'gt1l/land_ice_segments/fit_statistics/h_expected_rms',\n", - " 'gt1l/land_ice_segments/fit_statistics/h_mean',\n", - " 'gt1l/land_ice_segments/fit_statistics/h_rms_misfit',\n", - " 'gt1l/land_ice_segments/fit_statistics/h_robust_sprd',\n", - " 'gt1l/land_ice_segments/fit_statistics/n_fit_photons',\n", - " 'gt1l/land_ice_segments/fit_statistics/n_seg_pulses',\n", - " 'gt1l/land_ice_segments/fit_statistics/sigma_h_mean',\n", - " 'gt1l/land_ice_segments/fit_statistics/signal_selection_source',\n", - " 'gt1l/land_ice_segments/fit_statistics/signal_selection_source_status',\n", - " 'gt1l/land_ice_segments/fit_statistics/snr',\n", - " 'gt1l/land_ice_segments/fit_statistics/snr_significance',\n", - " 'gt1l/land_ice_segments/fit_statistics/w_surface_window_final',\n", - " 'gt1l/land_ice_segments/geophysical/bckgrd',\n", - " 'gt1l/land_ice_segments/geophysical/bsnow_conf',\n", - " 'gt1l/land_ice_segments/geophysical/bsnow_h',\n", - " 'gt1l/land_ice_segments/geophysical/bsnow_od',\n", - " 'gt1l/land_ice_segments/geophysical/cloud_flg_asr',\n", - " 'gt1l/land_ice_segments/geophysical/cloud_flg_atm',\n", - " 'gt1l/land_ice_segments/geophysical/dac',\n", - " 'gt1l/land_ice_segments/geophysical/e_bckgrd',\n", - " 'gt1l/land_ice_segments/geophysical/layer_flag',\n", - " 'gt1l/land_ice_segments/geophysical/msw_flag',\n", - " 'gt1l/land_ice_segments/geophysical/neutat_delay_total',\n", - " 'gt1l/land_ice_segments/geophysical/r_eff',\n", - " 'gt1l/land_ice_segments/geophysical/solar_azimuth',\n", - " 'gt1l/land_ice_segments/geophysical/solar_elevation',\n", - " 'gt1l/land_ice_segments/geophysical/tide_earth',\n", - 
" 'gt1l/land_ice_segments/geophysical/tide_earth_free2mean',\n", - " 'gt1l/land_ice_segments/geophysical/tide_equilibrium',\n", - " 'gt1l/land_ice_segments/geophysical/tide_load',\n", - " 'gt1l/land_ice_segments/geophysical/tide_ocean',\n", - " 'gt1l/land_ice_segments/geophysical/tide_pole',\n", - " 'gt1l/land_ice_segments/ground_track/ref_azimuth',\n", - " 'gt1l/land_ice_segments/ground_track/ref_coelv',\n", - " 'gt1l/land_ice_segments/ground_track/seg_azimuth',\n", - " 'gt1l/land_ice_segments/ground_track/sigma_geo_at',\n", - " 'gt1l/land_ice_segments/ground_track/sigma_geo_r',\n", - " 'gt1l/land_ice_segments/ground_track/sigma_geo_xt',\n", - " 'gt1l/land_ice_segments/ground_track/x_atc',\n", - " 'gt1l/land_ice_segments/ground_track/y_atc',\n", - " 'gt1l/land_ice_segments/h_li',\n", - " 'gt1l/land_ice_segments/h_li_sigma',\n", - " 'gt1l/land_ice_segments/latitude',\n", - " 'gt1l/land_ice_segments/longitude',\n", - " 'gt1l/land_ice_segments/segment_id',\n", - " 'gt1l/land_ice_segments/sigma_geo_h',\n", - " 'gt1l/residual_histogram/bckgrd_per_m',\n", - " 'gt1l/residual_histogram/bin_top_h',\n", - " 'gt1l/residual_histogram/count',\n", - " 'gt1l/residual_histogram/delta_time',\n", - " 'gt1l/residual_histogram/ds_segment_id',\n", - " 'gt1l/residual_histogram/lat_mean',\n", - " 'gt1l/residual_histogram/lon_mean',\n", - " 'gt1l/residual_histogram/pulse_count',\n", - " 'gt1l/residual_histogram/segment_id_list',\n", - " 'gt1l/residual_histogram/x_atc_mean',\n", - " 'gt1l/segment_quality/delta_time',\n", - " 'gt1l/segment_quality/record_number',\n", - " 'gt1l/segment_quality/reference_pt_lat',\n", - " 'gt1l/segment_quality/reference_pt_lon',\n", - " 'gt1l/segment_quality/segment_id',\n", - " 'gt1l/segment_quality/signal_selection_source',\n", - " 'gt1l/segment_quality/signal_selection_status/signal_selection_status_all',\n", - " 'gt1l/segment_quality/signal_selection_status/signal_selection_status_backup',\n", - " 
'gt1l/segment_quality/signal_selection_status/signal_selection_status_confident',\n", - " 'gt1r/land_ice_segments/atl06_quality_summary',\n", - " 'gt1r/land_ice_segments/bias_correction/fpb_mean_corr',\n", - " 'gt1r/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", - " 'gt1r/land_ice_segments/bias_correction/fpb_med_corr',\n", - " 'gt1r/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", - " 'gt1r/land_ice_segments/bias_correction/fpb_n_corr',\n", - " 'gt1r/land_ice_segments/bias_correction/med_r_fit',\n", - " 'gt1r/land_ice_segments/bias_correction/tx_mean_corr',\n", - " 'gt1r/land_ice_segments/bias_correction/tx_med_corr',\n", - " 'gt1r/land_ice_segments/delta_time',\n", - " 'gt1r/land_ice_segments/dem/dem_flag',\n", - " 'gt1r/land_ice_segments/dem/dem_h',\n", - " 'gt1r/land_ice_segments/dem/geoid_free2mean',\n", - " 'gt1r/land_ice_segments/dem/geoid_h',\n", - " 'gt1r/land_ice_segments/fit_statistics/dh_fit_dx',\n", - " 'gt1r/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", - " 'gt1r/land_ice_segments/fit_statistics/dh_fit_dy',\n", - " 'gt1r/land_ice_segments/fit_statistics/h_expected_rms',\n", - " 'gt1r/land_ice_segments/fit_statistics/h_mean',\n", - " 'gt1r/land_ice_segments/fit_statistics/h_rms_misfit',\n", - " 'gt1r/land_ice_segments/fit_statistics/h_robust_sprd',\n", - " 'gt1r/land_ice_segments/fit_statistics/n_fit_photons',\n", - " 'gt1r/land_ice_segments/fit_statistics/n_seg_pulses',\n", - " 'gt1r/land_ice_segments/fit_statistics/sigma_h_mean',\n", - " 'gt1r/land_ice_segments/fit_statistics/signal_selection_source',\n", - " 'gt1r/land_ice_segments/fit_statistics/signal_selection_source_status',\n", - " 'gt1r/land_ice_segments/fit_statistics/snr',\n", - " 'gt1r/land_ice_segments/fit_statistics/snr_significance',\n", - " 'gt1r/land_ice_segments/fit_statistics/w_surface_window_final',\n", - " 'gt1r/land_ice_segments/geophysical/bckgrd',\n", - " 'gt1r/land_ice_segments/geophysical/bsnow_conf',\n", - " 
'gt1r/land_ice_segments/geophysical/bsnow_h',\n", - " 'gt1r/land_ice_segments/geophysical/bsnow_od',\n", - " 'gt1r/land_ice_segments/geophysical/cloud_flg_asr',\n", - " 'gt1r/land_ice_segments/geophysical/cloud_flg_atm',\n", - " 'gt1r/land_ice_segments/geophysical/dac',\n", - " 'gt1r/land_ice_segments/geophysical/e_bckgrd',\n", - " 'gt1r/land_ice_segments/geophysical/layer_flag',\n", - " 'gt1r/land_ice_segments/geophysical/msw_flag',\n", - " 'gt1r/land_ice_segments/geophysical/neutat_delay_total',\n", - " 'gt1r/land_ice_segments/geophysical/r_eff',\n", - " 'gt1r/land_ice_segments/geophysical/solar_azimuth',\n", - " 'gt1r/land_ice_segments/geophysical/solar_elevation',\n", - " 'gt1r/land_ice_segments/geophysical/tide_earth',\n", - " 'gt1r/land_ice_segments/geophysical/tide_earth_free2mean',\n", - " 'gt1r/land_ice_segments/geophysical/tide_equilibrium',\n", - " 'gt1r/land_ice_segments/geophysical/tide_load',\n", - " 'gt1r/land_ice_segments/geophysical/tide_ocean',\n", - " 'gt1r/land_ice_segments/geophysical/tide_pole',\n", - " 'gt1r/land_ice_segments/ground_track/ref_azimuth',\n", - " 'gt1r/land_ice_segments/ground_track/ref_coelv',\n", - " 'gt1r/land_ice_segments/ground_track/seg_azimuth',\n", - " 'gt1r/land_ice_segments/ground_track/sigma_geo_at',\n", - " 'gt1r/land_ice_segments/ground_track/sigma_geo_r',\n", - " 'gt1r/land_ice_segments/ground_track/sigma_geo_xt',\n", - " 'gt1r/land_ice_segments/ground_track/x_atc',\n", - " 'gt1r/land_ice_segments/ground_track/y_atc',\n", - " 'gt1r/land_ice_segments/h_li',\n", - " 'gt1r/land_ice_segments/h_li_sigma',\n", - " 'gt1r/land_ice_segments/latitude',\n", - " 'gt1r/land_ice_segments/longitude',\n", - " 'gt1r/land_ice_segments/segment_id',\n", - " 'gt1r/land_ice_segments/sigma_geo_h',\n", - " 'gt1r/residual_histogram/bckgrd_per_m',\n", - " 'gt1r/residual_histogram/bin_top_h',\n", - " 'gt1r/residual_histogram/count',\n", - " 'gt1r/residual_histogram/delta_time',\n", - " 'gt1r/residual_histogram/ds_segment_id',\n", - " 
'gt1r/residual_histogram/lat_mean',\n", - " 'gt1r/residual_histogram/lon_mean',\n", - " 'gt1r/residual_histogram/pulse_count',\n", - " 'gt1r/residual_histogram/segment_id_list',\n", - " 'gt1r/residual_histogram/x_atc_mean',\n", - " 'gt1r/segment_quality/delta_time',\n", - " 'gt1r/segment_quality/record_number',\n", - " 'gt1r/segment_quality/reference_pt_lat',\n", - " 'gt1r/segment_quality/reference_pt_lon',\n", - " 'gt1r/segment_quality/segment_id',\n", - " 'gt1r/segment_quality/signal_selection_source',\n", - " 'gt1r/segment_quality/signal_selection_status/signal_selection_status_all',\n", - " 'gt1r/segment_quality/signal_selection_status/signal_selection_status_backup',\n", - " 'gt1r/segment_quality/signal_selection_status/signal_selection_status_confident',\n", - " 'gt2l/land_ice_segments/atl06_quality_summary',\n", - " 'gt2l/land_ice_segments/bias_correction/fpb_mean_corr',\n", - " 'gt2l/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", - " 'gt2l/land_ice_segments/bias_correction/fpb_med_corr',\n", - " 'gt2l/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", - " 'gt2l/land_ice_segments/bias_correction/fpb_n_corr',\n", - " 'gt2l/land_ice_segments/bias_correction/med_r_fit',\n", - " 'gt2l/land_ice_segments/bias_correction/tx_mean_corr',\n", - " 'gt2l/land_ice_segments/bias_correction/tx_med_corr',\n", - " 'gt2l/land_ice_segments/delta_time',\n", - " 'gt2l/land_ice_segments/dem/dem_flag',\n", - " 'gt2l/land_ice_segments/dem/dem_h',\n", - " 'gt2l/land_ice_segments/dem/geoid_free2mean',\n", - " 'gt2l/land_ice_segments/dem/geoid_h',\n", - " 'gt2l/land_ice_segments/fit_statistics/dh_fit_dx',\n", - " 'gt2l/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", - " 'gt2l/land_ice_segments/fit_statistics/dh_fit_dy',\n", - " 'gt2l/land_ice_segments/fit_statistics/h_expected_rms',\n", - " 'gt2l/land_ice_segments/fit_statistics/h_mean',\n", - " 'gt2l/land_ice_segments/fit_statistics/h_rms_misfit',\n", - " 
'gt2l/land_ice_segments/fit_statistics/h_robust_sprd',\n", - " 'gt2l/land_ice_segments/fit_statistics/n_fit_photons',\n", - " 'gt2l/land_ice_segments/fit_statistics/n_seg_pulses',\n", - " 'gt2l/land_ice_segments/fit_statistics/sigma_h_mean',\n", - " 'gt2l/land_ice_segments/fit_statistics/signal_selection_source',\n", - " 'gt2l/land_ice_segments/fit_statistics/signal_selection_source_status',\n", - " 'gt2l/land_ice_segments/fit_statistics/snr',\n", - " 'gt2l/land_ice_segments/fit_statistics/snr_significance',\n", - " 'gt2l/land_ice_segments/fit_statistics/w_surface_window_final',\n", - " 'gt2l/land_ice_segments/geophysical/bckgrd',\n", - " 'gt2l/land_ice_segments/geophysical/bsnow_conf',\n", - " 'gt2l/land_ice_segments/geophysical/bsnow_h',\n", - " 'gt2l/land_ice_segments/geophysical/bsnow_od',\n", - " 'gt2l/land_ice_segments/geophysical/cloud_flg_asr',\n", - " 'gt2l/land_ice_segments/geophysical/cloud_flg_atm',\n", - " 'gt2l/land_ice_segments/geophysical/dac',\n", - " 'gt2l/land_ice_segments/geophysical/e_bckgrd',\n", - " 'gt2l/land_ice_segments/geophysical/layer_flag',\n", - " 'gt2l/land_ice_segments/geophysical/msw_flag',\n", - " 'gt2l/land_ice_segments/geophysical/neutat_delay_total',\n", - " 'gt2l/land_ice_segments/geophysical/r_eff',\n", - " 'gt2l/land_ice_segments/geophysical/solar_azimuth',\n", - " 'gt2l/land_ice_segments/geophysical/solar_elevation',\n", - " 'gt2l/land_ice_segments/geophysical/tide_earth',\n", - " 'gt2l/land_ice_segments/geophysical/tide_earth_free2mean',\n", - " 'gt2l/land_ice_segments/geophysical/tide_equilibrium',\n", - " 'gt2l/land_ice_segments/geophysical/tide_load',\n", - " 'gt2l/land_ice_segments/geophysical/tide_ocean',\n", - " 'gt2l/land_ice_segments/geophysical/tide_pole',\n", - " 'gt2l/land_ice_segments/ground_track/ref_azimuth',\n", - " 'gt2l/land_ice_segments/ground_track/ref_coelv',\n", - " 'gt2l/land_ice_segments/ground_track/seg_azimuth',\n", - " 'gt2l/land_ice_segments/ground_track/sigma_geo_at',\n", - " 
'gt2l/land_ice_segments/ground_track/sigma_geo_r',\n", - " 'gt2l/land_ice_segments/ground_track/sigma_geo_xt',\n", - " 'gt2l/land_ice_segments/ground_track/x_atc',\n", - " 'gt2l/land_ice_segments/ground_track/y_atc',\n", - " 'gt2l/land_ice_segments/h_li',\n", - " 'gt2l/land_ice_segments/h_li_sigma',\n", - " 'gt2l/land_ice_segments/latitude',\n", - " 'gt2l/land_ice_segments/longitude',\n", - " 'gt2l/land_ice_segments/segment_id',\n", - " 'gt2l/land_ice_segments/sigma_geo_h',\n", - " 'gt2l/residual_histogram/bckgrd_per_m',\n", - " 'gt2l/residual_histogram/bin_top_h',\n", - " 'gt2l/residual_histogram/count',\n", - " 'gt2l/residual_histogram/delta_time',\n", - " 'gt2l/residual_histogram/ds_segment_id',\n", - " 'gt2l/residual_histogram/lat_mean',\n", - " 'gt2l/residual_histogram/lon_mean',\n", - " 'gt2l/residual_histogram/pulse_count',\n", - " 'gt2l/residual_histogram/segment_id_list',\n", - " 'gt2l/residual_histogram/x_atc_mean',\n", - " 'gt2l/segment_quality/delta_time',\n", - " 'gt2l/segment_quality/record_number',\n", - " 'gt2l/segment_quality/reference_pt_lat',\n", - " 'gt2l/segment_quality/reference_pt_lon',\n", - " 'gt2l/segment_quality/segment_id',\n", - " 'gt2l/segment_quality/signal_selection_source',\n", - " 'gt2l/segment_quality/signal_selection_status/signal_selection_status_all',\n", - " 'gt2l/segment_quality/signal_selection_status/signal_selection_status_backup',\n", - " 'gt2l/segment_quality/signal_selection_status/signal_selection_status_confident',\n", - " 'gt2r/land_ice_segments/atl06_quality_summary',\n", - " 'gt2r/land_ice_segments/bias_correction/fpb_mean_corr',\n", - " 'gt2r/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", - " 'gt2r/land_ice_segments/bias_correction/fpb_med_corr',\n", - " 'gt2r/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", - " 'gt2r/land_ice_segments/bias_correction/fpb_n_corr',\n", - " 'gt2r/land_ice_segments/bias_correction/med_r_fit',\n", - " 'gt2r/land_ice_segments/bias_correction/tx_mean_corr',\n", - 
" 'gt2r/land_ice_segments/bias_correction/tx_med_corr',\n", - " 'gt2r/land_ice_segments/delta_time',\n", - " 'gt2r/land_ice_segments/dem/dem_flag',\n", - " 'gt2r/land_ice_segments/dem/dem_h',\n", - " 'gt2r/land_ice_segments/dem/geoid_free2mean',\n", - " 'gt2r/land_ice_segments/dem/geoid_h',\n", - " 'gt2r/land_ice_segments/fit_statistics/dh_fit_dx',\n", - " 'gt2r/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", - " 'gt2r/land_ice_segments/fit_statistics/dh_fit_dy',\n", - " 'gt2r/land_ice_segments/fit_statistics/h_expected_rms',\n", - " 'gt2r/land_ice_segments/fit_statistics/h_mean',\n", - " 'gt2r/land_ice_segments/fit_statistics/h_rms_misfit',\n", - " 'gt2r/land_ice_segments/fit_statistics/h_robust_sprd',\n", - " 'gt2r/land_ice_segments/fit_statistics/n_fit_photons',\n", - " 'gt2r/land_ice_segments/fit_statistics/n_seg_pulses',\n", - " 'gt2r/land_ice_segments/fit_statistics/sigma_h_mean',\n", - " 'gt2r/land_ice_segments/fit_statistics/signal_selection_source',\n", - " 'gt2r/land_ice_segments/fit_statistics/signal_selection_source_status',\n", - " 'gt2r/land_ice_segments/fit_statistics/snr',\n", - " 'gt2r/land_ice_segments/fit_statistics/snr_significance',\n", - " 'gt2r/land_ice_segments/fit_statistics/w_surface_window_final',\n", - " 'gt2r/land_ice_segments/geophysical/bckgrd',\n", - " 'gt2r/land_ice_segments/geophysical/bsnow_conf',\n", - " 'gt2r/land_ice_segments/geophysical/bsnow_h',\n", - " 'gt2r/land_ice_segments/geophysical/bsnow_od',\n", - " 'gt2r/land_ice_segments/geophysical/cloud_flg_asr',\n", - " 'gt2r/land_ice_segments/geophysical/cloud_flg_atm',\n", - " 'gt2r/land_ice_segments/geophysical/dac',\n", - " 'gt2r/land_ice_segments/geophysical/e_bckgrd',\n", - " 'gt2r/land_ice_segments/geophysical/layer_flag',\n", - " 'gt2r/land_ice_segments/geophysical/msw_flag',\n", - " 'gt2r/land_ice_segments/geophysical/neutat_delay_total',\n", - " 'gt2r/land_ice_segments/geophysical/r_eff',\n", - " 'gt2r/land_ice_segments/geophysical/solar_azimuth',\n", - " 
'gt2r/land_ice_segments/geophysical/solar_elevation',\n", - " 'gt2r/land_ice_segments/geophysical/tide_earth',\n", - " 'gt2r/land_ice_segments/geophysical/tide_earth_free2mean',\n", - " 'gt2r/land_ice_segments/geophysical/tide_equilibrium',\n", - " 'gt2r/land_ice_segments/geophysical/tide_load',\n", - " 'gt2r/land_ice_segments/geophysical/tide_ocean',\n", - " 'gt2r/land_ice_segments/geophysical/tide_pole',\n", - " 'gt2r/land_ice_segments/ground_track/ref_azimuth',\n", - " 'gt2r/land_ice_segments/ground_track/ref_coelv',\n", - " 'gt2r/land_ice_segments/ground_track/seg_azimuth',\n", - " 'gt2r/land_ice_segments/ground_track/sigma_geo_at',\n", - " 'gt2r/land_ice_segments/ground_track/sigma_geo_r',\n", - " 'gt2r/land_ice_segments/ground_track/sigma_geo_xt',\n", - " 'gt2r/land_ice_segments/ground_track/x_atc',\n", - " 'gt2r/land_ice_segments/ground_track/y_atc',\n", - " 'gt2r/land_ice_segments/h_li',\n", - " 'gt2r/land_ice_segments/h_li_sigma',\n", - " 'gt2r/land_ice_segments/latitude',\n", - " 'gt2r/land_ice_segments/longitude',\n", - " 'gt2r/land_ice_segments/segment_id',\n", - " 'gt2r/land_ice_segments/sigma_geo_h',\n", - " 'gt2r/residual_histogram/bckgrd_per_m',\n", - " 'gt2r/residual_histogram/bin_top_h',\n", - " 'gt2r/residual_histogram/count',\n", - " 'gt2r/residual_histogram/delta_time',\n", - " 'gt2r/residual_histogram/ds_segment_id',\n", - " 'gt2r/residual_histogram/lat_mean',\n", - " 'gt2r/residual_histogram/lon_mean',\n", - " 'gt2r/residual_histogram/pulse_count',\n", - " 'gt2r/residual_histogram/segment_id_list',\n", - " 'gt2r/residual_histogram/x_atc_mean',\n", - " 'gt2r/segment_quality/delta_time',\n", - " 'gt2r/segment_quality/record_number',\n", - " 'gt2r/segment_quality/reference_pt_lat',\n", - " 'gt2r/segment_quality/reference_pt_lon',\n", - " 'gt2r/segment_quality/segment_id',\n", - " 'gt2r/segment_quality/signal_selection_source',\n", - " 'gt2r/segment_quality/signal_selection_status/signal_selection_status_all',\n", - " 
'gt2r/segment_quality/signal_selection_status/signal_selection_status_backup',\n", - " 'gt2r/segment_quality/signal_selection_status/signal_selection_status_confident',\n", - " 'gt3l/land_ice_segments/atl06_quality_summary',\n", - " 'gt3l/land_ice_segments/bias_correction/fpb_mean_corr',\n", - " 'gt3l/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", - " 'gt3l/land_ice_segments/bias_correction/fpb_med_corr',\n", - " 'gt3l/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", - " 'gt3l/land_ice_segments/bias_correction/fpb_n_corr',\n", - " 'gt3l/land_ice_segments/bias_correction/med_r_fit',\n", - " 'gt3l/land_ice_segments/bias_correction/tx_mean_corr',\n", - " 'gt3l/land_ice_segments/bias_correction/tx_med_corr',\n", - " 'gt3l/land_ice_segments/delta_time',\n", - " 'gt3l/land_ice_segments/dem/dem_flag',\n", - " 'gt3l/land_ice_segments/dem/dem_h',\n", - " 'gt3l/land_ice_segments/dem/geoid_free2mean',\n", - " 'gt3l/land_ice_segments/dem/geoid_h',\n", - " 'gt3l/land_ice_segments/fit_statistics/dh_fit_dx',\n", - " 'gt3l/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", - " 'gt3l/land_ice_segments/fit_statistics/dh_fit_dy',\n", - " 'gt3l/land_ice_segments/fit_statistics/h_expected_rms',\n", - " 'gt3l/land_ice_segments/fit_statistics/h_mean',\n", - " 'gt3l/land_ice_segments/fit_statistics/h_rms_misfit',\n", - " 'gt3l/land_ice_segments/fit_statistics/h_robust_sprd',\n", - " 'gt3l/land_ice_segments/fit_statistics/n_fit_photons',\n", - " 'gt3l/land_ice_segments/fit_statistics/n_seg_pulses',\n", - " 'gt3l/land_ice_segments/fit_statistics/sigma_h_mean',\n", - " 'gt3l/land_ice_segments/fit_statistics/signal_selection_source',\n", - " 'gt3l/land_ice_segments/fit_statistics/signal_selection_source_status',\n", - " 'gt3l/land_ice_segments/fit_statistics/snr',\n", - " 'gt3l/land_ice_segments/fit_statistics/snr_significance',\n", - " 'gt3l/land_ice_segments/fit_statistics/w_surface_window_final',\n", - " 'gt3l/land_ice_segments/geophysical/bckgrd',\n", - " 
'gt3l/land_ice_segments/geophysical/bsnow_conf',\n", - " 'gt3l/land_ice_segments/geophysical/bsnow_h',\n", - " 'gt3l/land_ice_segments/geophysical/bsnow_od',\n", - " 'gt3l/land_ice_segments/geophysical/cloud_flg_asr',\n", - " 'gt3l/land_ice_segments/geophysical/cloud_flg_atm',\n", - " 'gt3l/land_ice_segments/geophysical/dac',\n", - " 'gt3l/land_ice_segments/geophysical/e_bckgrd',\n", - " 'gt3l/land_ice_segments/geophysical/layer_flag',\n", - " 'gt3l/land_ice_segments/geophysical/msw_flag',\n", - " 'gt3l/land_ice_segments/geophysical/neutat_delay_total',\n", - " 'gt3l/land_ice_segments/geophysical/r_eff',\n", - " 'gt3l/land_ice_segments/geophysical/solar_azimuth',\n", - " 'gt3l/land_ice_segments/geophysical/solar_elevation',\n", - " 'gt3l/land_ice_segments/geophysical/tide_earth',\n", - " 'gt3l/land_ice_segments/geophysical/tide_earth_free2mean',\n", - " 'gt3l/land_ice_segments/geophysical/tide_equilibrium',\n", - " 'gt3l/land_ice_segments/geophysical/tide_load',\n", - " 'gt3l/land_ice_segments/geophysical/tide_ocean',\n", - " 'gt3l/land_ice_segments/geophysical/tide_pole',\n", - " 'gt3l/land_ice_segments/ground_track/ref_azimuth',\n", - " 'gt3l/land_ice_segments/ground_track/ref_coelv',\n", - " 'gt3l/land_ice_segments/ground_track/seg_azimuth',\n", - " 'gt3l/land_ice_segments/ground_track/sigma_geo_at',\n", - " 'gt3l/land_ice_segments/ground_track/sigma_geo_r',\n", - " 'gt3l/land_ice_segments/ground_track/sigma_geo_xt',\n", - " 'gt3l/land_ice_segments/ground_track/x_atc',\n", - " 'gt3l/land_ice_segments/ground_track/y_atc',\n", - " 'gt3l/land_ice_segments/h_li',\n", - " 'gt3l/land_ice_segments/h_li_sigma',\n", - " 'gt3l/land_ice_segments/latitude',\n", - " 'gt3l/land_ice_segments/longitude',\n", - " 'gt3l/land_ice_segments/segment_id',\n", - " 'gt3l/land_ice_segments/sigma_geo_h',\n", - " 'gt3l/residual_histogram/bckgrd_per_m',\n", - " 'gt3l/residual_histogram/bin_top_h',\n", - " 'gt3l/residual_histogram/count',\n", - " 'gt3l/residual_histogram/delta_time',\n", - " 
'gt3l/residual_histogram/ds_segment_id',\n", - " 'gt3l/residual_histogram/lat_mean',\n", - " 'gt3l/residual_histogram/lon_mean',\n", - " 'gt3l/residual_histogram/pulse_count',\n", - " 'gt3l/residual_histogram/segment_id_list',\n", - " 'gt3l/residual_histogram/x_atc_mean',\n", - " 'gt3l/segment_quality/delta_time',\n", - " 'gt3l/segment_quality/record_number',\n", - " 'gt3l/segment_quality/reference_pt_lat',\n", - " 'gt3l/segment_quality/reference_pt_lon',\n", - " 'gt3l/segment_quality/segment_id',\n", - " 'gt3l/segment_quality/signal_selection_source',\n", - " 'gt3l/segment_quality/signal_selection_status/signal_selection_status_all',\n", - " 'gt3l/segment_quality/signal_selection_status/signal_selection_status_backup',\n", - " 'gt3l/segment_quality/signal_selection_status/signal_selection_status_confident',\n", - " 'gt3r/land_ice_segments/atl06_quality_summary',\n", - " 'gt3r/land_ice_segments/bias_correction/fpb_mean_corr',\n", - " 'gt3r/land_ice_segments/bias_correction/fpb_mean_corr_sigma',\n", - " 'gt3r/land_ice_segments/bias_correction/fpb_med_corr',\n", - " 'gt3r/land_ice_segments/bias_correction/fpb_med_corr_sigma',\n", - " 'gt3r/land_ice_segments/bias_correction/fpb_n_corr',\n", - " 'gt3r/land_ice_segments/bias_correction/med_r_fit',\n", - " 'gt3r/land_ice_segments/bias_correction/tx_mean_corr',\n", - " 'gt3r/land_ice_segments/bias_correction/tx_med_corr',\n", - " 'gt3r/land_ice_segments/delta_time',\n", - " 'gt3r/land_ice_segments/dem/dem_flag',\n", - " 'gt3r/land_ice_segments/dem/dem_h',\n", - " 'gt3r/land_ice_segments/dem/geoid_free2mean',\n", - " 'gt3r/land_ice_segments/dem/geoid_h',\n", - " 'gt3r/land_ice_segments/fit_statistics/dh_fit_dx',\n", - " 'gt3r/land_ice_segments/fit_statistics/dh_fit_dx_sigma',\n", - " 'gt3r/land_ice_segments/fit_statistics/dh_fit_dy',\n", - " 'gt3r/land_ice_segments/fit_statistics/h_expected_rms',\n", - " 'gt3r/land_ice_segments/fit_statistics/h_mean',\n", - " 'gt3r/land_ice_segments/fit_statistics/h_rms_misfit',\n", - " 
'gt3r/land_ice_segments/fit_statistics/h_robust_sprd',\n", - " 'gt3r/land_ice_segments/fit_statistics/n_fit_photons',\n", - " 'gt3r/land_ice_segments/fit_statistics/n_seg_pulses',\n", - " 'gt3r/land_ice_segments/fit_statistics/sigma_h_mean',\n", - " 'gt3r/land_ice_segments/fit_statistics/signal_selection_source',\n", - " 'gt3r/land_ice_segments/fit_statistics/signal_selection_source_status',\n", - " 'gt3r/land_ice_segments/fit_statistics/snr',\n", - " 'gt3r/land_ice_segments/fit_statistics/snr_significance',\n", - " 'gt3r/land_ice_segments/fit_statistics/w_surface_window_final',\n", - " 'gt3r/land_ice_segments/geophysical/bckgrd',\n", - " 'gt3r/land_ice_segments/geophysical/bsnow_conf',\n", - " 'gt3r/land_ice_segments/geophysical/bsnow_h',\n", - " 'gt3r/land_ice_segments/geophysical/bsnow_od',\n", - " 'gt3r/land_ice_segments/geophysical/cloud_flg_asr',\n", - " 'gt3r/land_ice_segments/geophysical/cloud_flg_atm',\n", - " 'gt3r/land_ice_segments/geophysical/dac',\n", - " 'gt3r/land_ice_segments/geophysical/e_bckgrd',\n", - " 'gt3r/land_ice_segments/geophysical/layer_flag',\n", - " 'gt3r/land_ice_segments/geophysical/msw_flag',\n", - " 'gt3r/land_ice_segments/geophysical/neutat_delay_total',\n", - " 'gt3r/land_ice_segments/geophysical/r_eff',\n", - " 'gt3r/land_ice_segments/geophysical/solar_azimuth',\n", - " 'gt3r/land_ice_segments/geophysical/solar_elevation',\n", - " 'gt3r/land_ice_segments/geophysical/tide_earth',\n", - " 'gt3r/land_ice_segments/geophysical/tide_earth_free2mean',\n", - " 'gt3r/land_ice_segments/geophysical/tide_equilibrium',\n", - " 'gt3r/land_ice_segments/geophysical/tide_load',\n", - " 'gt3r/land_ice_segments/geophysical/tide_ocean',\n", - " 'gt3r/land_ice_segments/geophysical/tide_pole',\n", - " 'gt3r/land_ice_segments/ground_track/ref_azimuth',\n", - " 'gt3r/land_ice_segments/ground_track/ref_coelv',\n", - " 'gt3r/land_ice_segments/ground_track/seg_azimuth',\n", - " 'gt3r/land_ice_segments/ground_track/sigma_geo_at',\n", - " 
'gt3r/land_ice_segments/ground_track/sigma_geo_r',\n", - " 'gt3r/land_ice_segments/ground_track/sigma_geo_xt',\n", - " 'gt3r/land_ice_segments/ground_track/x_atc',\n", - " 'gt3r/land_ice_segments/ground_track/y_atc',\n", - " 'gt3r/land_ice_segments/h_li',\n", - " 'gt3r/land_ice_segments/h_li_sigma',\n", - " 'gt3r/land_ice_segments/latitude',\n", - " 'gt3r/land_ice_segments/longitude',\n", - " 'gt3r/land_ice_segments/segment_id',\n", - " 'gt3r/land_ice_segments/sigma_geo_h',\n", - " 'gt3r/residual_histogram/bckgrd_per_m',\n", - " 'gt3r/residual_histogram/bin_top_h',\n", - " 'gt3r/residual_histogram/count',\n", - " 'gt3r/residual_histogram/delta_time',\n", - " 'gt3r/residual_histogram/ds_segment_id',\n", - " 'gt3r/residual_histogram/lat_mean',\n", - " 'gt3r/residual_histogram/lon_mean',\n", - " 'gt3r/residual_histogram/pulse_count',\n", - " 'gt3r/residual_histogram/segment_id_list',\n", - " 'gt3r/residual_histogram/x_atc_mean',\n", - " 'gt3r/segment_quality/delta_time',\n", - " 'gt3r/segment_quality/record_number',\n", - " 'gt3r/segment_quality/reference_pt_lat',\n", - " 'gt3r/segment_quality/reference_pt_lon',\n", - " 'gt3r/segment_quality/segment_id',\n", - " 'gt3r/segment_quality/signal_selection_source',\n", - " 'gt3r/segment_quality/signal_selection_status/signal_selection_status_all',\n", - " 'gt3r/segment_quality/signal_selection_status/signal_selection_status_backup',\n", - " 'gt3r/segment_quality/signal_selection_status/signal_selection_status_confident',\n", - " 'orbit_info/bounding_polygon_lat1',\n", - " 'orbit_info/bounding_polygon_lon1',\n", - " 'orbit_info/crossing_time',\n", - " 'orbit_info/cycle_number',\n", - " 'orbit_info/lan',\n", - " 'orbit_info/orbit_number',\n", - " 'orbit_info/rgt',\n", - " 'orbit_info/sc_orient',\n", - " 'orbit_info/sc_orient_time',\n", - " 'quality_assessment/gt1l/delta_time',\n", - " 'quality_assessment/gt1l/lat_mean',\n", - " 'quality_assessment/gt1l/lon_mean',\n", - " 
'quality_assessment/gt1l/signal_selection_source_fraction_0',\n", - " 'quality_assessment/gt1l/signal_selection_source_fraction_1',\n", - " 'quality_assessment/gt1l/signal_selection_source_fraction_2',\n", - " 'quality_assessment/gt1l/signal_selection_source_fraction_3',\n", - " 'quality_assessment/gt1r/delta_time',\n", - " 'quality_assessment/gt1r/lat_mean',\n", - " 'quality_assessment/gt1r/lon_mean',\n", - " 'quality_assessment/gt1r/signal_selection_source_fraction_0',\n", - " 'quality_assessment/gt1r/signal_selection_source_fraction_1',\n", - " 'quality_assessment/gt1r/signal_selection_source_fraction_2',\n", - " 'quality_assessment/gt1r/signal_selection_source_fraction_3',\n", - " 'quality_assessment/gt2l/delta_time',\n", - " 'quality_assessment/gt2l/lat_mean',\n", - " 'quality_assessment/gt2l/lon_mean',\n", - " 'quality_assessment/gt2l/signal_selection_source_fraction_0',\n", - " 'quality_assessment/gt2l/signal_selection_source_fraction_1',\n", - " 'quality_assessment/gt2l/signal_selection_source_fraction_2',\n", - " 'quality_assessment/gt2l/signal_selection_source_fraction_3',\n", - " 'quality_assessment/gt2r/delta_time',\n", - " 'quality_assessment/gt2r/lat_mean',\n", - " 'quality_assessment/gt2r/lon_mean',\n", - " 'quality_assessment/gt2r/signal_selection_source_fraction_0',\n", - " 'quality_assessment/gt2r/signal_selection_source_fraction_1',\n", - " 'quality_assessment/gt2r/signal_selection_source_fraction_2',\n", - " 'quality_assessment/gt2r/signal_selection_source_fraction_3',\n", - " 'quality_assessment/gt3l/delta_time',\n", - " 'quality_assessment/gt3l/lat_mean',\n", - " 'quality_assessment/gt3l/lon_mean',\n", - " 'quality_assessment/gt3l/signal_selection_source_fraction_0',\n", - " 'quality_assessment/gt3l/signal_selection_source_fraction_1',\n", - " 'quality_assessment/gt3l/signal_selection_source_fraction_2',\n", - " 'quality_assessment/gt3l/signal_selection_source_fraction_3',\n", - " 'quality_assessment/gt3r/delta_time',\n", - " 
'quality_assessment/gt3r/lat_mean',\n", - " 'quality_assessment/gt3r/lon_mean',\n", - " 'quality_assessment/gt3r/signal_selection_source_fraction_0',\n", - " 'quality_assessment/gt3r/signal_selection_source_fraction_1',\n", - " 'quality_assessment/gt3r/signal_selection_source_fraction_2',\n", - " 'quality_assessment/gt3r/signal_selection_source_fraction_3',\n", - " 'quality_assessment/qa_granule_fail_reason',\n", - " 'quality_assessment/qa_granule_pass_fail']" - ] - }, - "execution_count": 21, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "reader.vars.avail()" ] @@ -1635,7 +371,7 @@ }, { "cell_type": "code", - "execution_count": 28, + "execution_count": null, "id": "e3734e09", "metadata": {}, "outputs": [], @@ -1655,44 +391,10 @@ }, { "cell_type": "code", - "execution_count": 29, + "execution_count": null, "id": "e5456e36", "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "{'sc_orient': ['orbit_info/sc_orient'],\n", - " 'atlas_sdp_gps_epoch': ['ancillary_data/atlas_sdp_gps_epoch'],\n", - " 'cycle_number': ['orbit_info/cycle_number'],\n", - " 'rgt': ['orbit_info/rgt'],\n", - " 'data_start_utc': ['ancillary_data/data_start_utc'],\n", - " 'data_end_utc': ['ancillary_data/data_end_utc'],\n", - " 'h_li': ['gt1l/land_ice_segments/h_li',\n", - " 'gt1r/land_ice_segments/h_li',\n", - " 'gt2l/land_ice_segments/h_li',\n", - " 'gt2r/land_ice_segments/h_li',\n", - " 'gt3l/land_ice_segments/h_li',\n", - " 'gt3r/land_ice_segments/h_li'],\n", - " 'latitude': ['gt1l/land_ice_segments/latitude',\n", - " 'gt1r/land_ice_segments/latitude',\n", - " 'gt2l/land_ice_segments/latitude',\n", - " 'gt2r/land_ice_segments/latitude',\n", - " 'gt3l/land_ice_segments/latitude',\n", - " 'gt3r/land_ice_segments/latitude'],\n", - " 'longitude': ['gt1l/land_ice_segments/longitude',\n", - " 'gt1r/land_ice_segments/longitude',\n", - " 'gt2l/land_ice_segments/longitude',\n", - " 'gt2r/land_ice_segments/longitude',\n", - " 
'gt3l/land_ice_segments/longitude',\n", - " 'gt3r/land_ice_segments/longitude']}" - ] - }, - "execution_count": 29, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "reader.vars.wanted" ] @@ -1709,7 +411,7 @@ }, { "cell_type": "code", - "execution_count": 24, + "execution_count": null, "id": "69894391", "metadata": {}, "outputs": [], @@ -1739,113 +441,10 @@ }, { "cell_type": "code", - "execution_count": 30, + "execution_count": null, "id": "eaabc976", "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. 
This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. 
This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. 
This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:49: UserWarning: Converting non-nanosecond precision datetime values to nanosecond precision. 
This behavior can eventually be relaxed in xarray, as it is an artifact from pandas which is now beginning to support non-nanosecond precision values. This warning is caused by passing non-nanosecond np.datetime64 or np.timedelta64 values to the DataArray or Variable constructor; it can be silenced by converting the values to nanosecond precision ahead of time.\n", - " df.update({keyword: df[keyword].str[:-1].astype(np.datetime64)})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. 
Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n", - "/home/jovyan/envs/general/lib/python3.11/site-packages/icepyx/core/read.py:490: UserWarning: rename 'delta_time' to 'photon_idx' does not create an index anymore. Try using swap_dims instead or use set_index after rename to create an indexed coordinate.\n", - " .rename({\"delta_time\": \"photon_idx\"})\n" - ] - } - ], + "outputs": [], "source": [ "ds = reader.load()" ] @@ -1866,549 +465,10 @@ }, { "cell_type": "code", - "execution_count": 26, + "execution_count": null, "id": "723256f7", "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "
<xarray.Dataset>\n",
-       "Dimensions:              (photon_idx: 29027, spot: 2, gran_idx: 6)\n",
-       "Coordinates:\n",
-       "  * photon_idx           (photon_idx) int64 0 1 2 3 ... 29023 29024 29025 29026\n",
-       "  * spot                 (spot) uint8 2 5\n",
-       "  * gran_idx             (gran_idx) float64 8.49e+04 9.02e+04 ... 1.016e+05\n",
-       "    source_file          (gran_idx) <U72 '../../../../data/ATL06/processed_AT...\n",
-       "    delta_time           (gran_idx, photon_idx) datetime64[ns] 2019-02-22T01:...\n",
-       "Data variables:\n",
-       "    sc_orient            (gran_idx) int8 0 0 0 1 1 1\n",
-       "    cycle_number         (gran_idx) int8 2 2 2 5 5 5\n",
-       "    rgt                  (gran_idx) int16 849 902 910 986 1001 1016\n",
-       "    atlas_sdp_gps_epoch  (gran_idx) datetime64[ns] 2018-01-01T00:00:18 ... 20...\n",
-       "    data_start_utc       (gran_idx) datetime64[ns] 2019-02-22T01:03:44.199777...\n",
-       "    data_end_utc         (gran_idx) datetime64[ns] 2019-02-22T01:07:38.112326...\n",
-       "    h_li                 (spot, gran_idx, photon_idx) float32 nan nan ... nan\n",
-       "    latitude             (spot, gran_idx, photon_idx) float64 nan nan ... nan\n",
-       "    longitude            (spot, gran_idx, photon_idx) float64 nan nan ... nan\n",
-       "    gt                   (gran_idx, spot) <U4 'gt3r' 'gt1l' ... 'gt1l' 'gt3r'\n",
-       "Attributes:\n",
-       "    data_product:  ATL06\n",
-       "    Description:   The land_ice_height group contains the primary set of deri...\n",
-       "    data_rate:     Data within this group are sparse.  Data values are provid...
" - ], - "text/plain": [ - "\n", - "Dimensions: (photon_idx: 29027, spot: 2, gran_idx: 6)\n", - "Coordinates:\n", - " * photon_idx (photon_idx) int64 0 1 2 3 ... 29023 29024 29025 29026\n", - " * spot (spot) uint8 2 5\n", - " * gran_idx (gran_idx) float64 8.49e+04 9.02e+04 ... 1.016e+05\n", - " source_file (gran_idx) " - ] - }, - "execution_count": 27, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "ds.plot.scatter(x=\"longitude\", y=\"latitude\", hue=\"h_li\", vmin=-100, vmax=2000)" ] From b26ca4eb0ed54cf075bf6c53f31cd78114e5c182 Mon Sep 17 00:00:00 2001 From: Rachel Wegener <35503632+rwegener2@users.noreply.github.com> Date: Fri, 1 Sep 2023 13:38:37 -0400 Subject: [PATCH 10/30] Update icepyx/core/read.py Co-authored-by: Wei Ji <23487320+weiji14@users.noreply.github.com> --- icepyx/core/read.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index d3ca0d82a..2ffe32cb7 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -680,7 +680,7 @@ def _build_dataset_template(self, file): def _read_single_grp(self, file, grp_path): """ - For a given file and variable group path, construct an an xarray Dataset. + For a given file and variable group path, construct an xarray Dataset. 
Parameters ---------- From ce1ca76b7e2d586eaba3695308fae0e0bcd4805f Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Fri, 1 Sep 2023 17:40:10 +0000 Subject: [PATCH 11/30] remove intake and related modules --- requirements.txt | 2 -- 1 file changed, 2 deletions(-) diff --git a/requirements.txt b/requirements.txt index 86618f108..06f4ad9a7 100644 --- a/requirements.txt +++ b/requirements.txt @@ -7,8 +7,6 @@ h5netcdf h5py holoviews hvplot -intake -intake-xarray matplotlib numpy requests From 431af78cd55d51fd08881e440d1a55681816db5b Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 5 Sep 2023 16:27:50 +0000 Subject: [PATCH 12/30] mvp with new read parameters --- icepyx/core/read.py | 114 +++++++++++++++++++++++++++++--------------- 1 file changed, 75 insertions(+), 39 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index 2ffe32cb7..c15957210 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -1,11 +1,14 @@ import fnmatch +import glob import os import warnings +import h5py import numpy as np import xarray as xr import icepyx.core.is2ref as is2ref +from icepyx.core.query import Query from icepyx.core.variables import Variables as Variables from icepyx.core.variables import list_of_dict_vals @@ -297,56 +300,79 @@ class Read: def __init__( self, - data_source=None, + path, # TODO how to deal with the fact that this is required in later versions + # but does not exist in past versions? + out_obj_type=None, # xr.Dataset, product=None, + data_source=None, filename_pattern="ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5", - out_obj_type=None, # xr.Dataset, ): - if data_source is None: - raise ValueError("Please provide a data source.") - else: - self._source_type = _check_datasource(data_source) - self.data_source = data_source - - if product is None: - raise ValueError( - "Please provide the ICESat-2 data product of your file(s)." 
- ) - else: - self._prod = is2ref._validate_product(product) - pattern_ck, filelist = Read._check_source_for_pattern( - data_source, filename_pattern - ) - assert pattern_ck - # Note: need to check if this works for subset and non-subset NSIDC files (processed_ prepends the former) - self._pattern = filename_pattern - - # this is a first pass at getting rid of mixed product types and warning the user. - # it takes an approach assuming the product name is in the filename, but needs reworking if we let multiple products be loaded - # one way to handle this would be bring in the product info during the loading step and fill in product there instead of requiring it from the user - filtered_filelist = [file for file in filelist if self._prod in file] - if len(filtered_filelist) == 0: - warnings.warn( - "Your filenames do not contain a product identifier (e.g. ATL06). " - "You will likely need to manually merge your dataframes." - ) - self._filelist = filelist - elif len(filtered_filelist) < len(filelist): - warnings.warn( - "Some files matching your filename pattern were removed as they were not the specified product." - ) - self._filelist = filtered_filelist + # Raise warnings for depreciated arguments + if data_source: + warnings.warn('The `data_source` argument is depreciated. Please use the path argument instead.') + # TODO this check doesn't work because default isn't None + if filename_pattern: + warnings.warn('The `filename_pattern` argument is depreciated. Instead please provide a glob string to the `path` argument') + + # CREATE THE FILELIST + # Create the filelist from the user `path` argument + if isinstance(path, list): + self._filelist = path + # Discussion: I think actually this parameter type will only exist for cloud? + # Unless we really want to abstract more stuff, i.e. the downloading + # elif isinstance(path, Query): + # self._filelist = path. 
+ elif os.path.isdir(path): + path = os.path.join(path, '*') + # TODO better flow so ths glob doesn't happen twice + self._filelist = glob.glob(path) else: - self._filelist = filelist - + # Discussion: should we default to recursive or not? + # Could allow for glob kwargs, but at that point I think we should just tell + # the user to run glob themself to create the filelist. + self._filelist = glob.glob(path) + + # EXTRACT THE PRODUCT FOR EACH FILE + # Note for ticket: this logic got a little complex in the attempt to maintain a + # user-given product argument. If this gets depreciated we could depricate this + # Create a dictionary of the metadata extracted + product_dict = {} + for file_ in self._filelist: + product_dict[file_] = self._extract_product(file_) + # DEAL WITH MULTIPLE PRODUCTS IN THE LIST + # raise warning if there are multiple products present + if len(set(product_dict.values())) > 1: + # filter to only one product + if product: + warnings.warn(f'Multiple products found in list of files: {product_dict}. Files that do not match the user specified product will be removed from processing.') + # TODO thoughts on making filelist public read-only? It seems fair as I write + # all these warnings/error messages that reference a filelist. + self._filelist = [] + for key, value in product_dict.items(): + if value == product: + self._filelist.append(key) + product_dict.pop(key) + if len(self._filelist) == 0: + raise 'No files found in the file list matching the user-specified product type' + else: + raise TypeError(f'Multiple product types were found in the file list: {product_dict}. Please provide a valid `path` parameter indicating files of a single product') + # ASSIGN A PRODUCT TO THIS FILELIST + self.product = list(product_dict.values())[0] + if product and self.product != product: + warnings.warn(f'User specified product {product} does not match the product from the file metadata {self.product}') + + # Discussion: is this code meaningful to others? 
or can it be cleaned up? # after validation, use the notebook code and code outline to start implementing the rest of the class - + if out_obj_type is not None: print( "Output object type will be an xarray DataSet - " "no other output types are implemented yet" ) self._out_obj = xr.Dataset + + print('filelist:', self._filelist) + print('product', self.product) # ---------------------------------------------------------------------- # Properties @@ -379,6 +405,16 @@ def vars(self): # ---------------------------------------------------------------------- # Methods + + @staticmethod + def _extract_product(filepath): + with h5py.File(filepath, 'r') as f: + try: + product = f['METADATA']['DatasetIdentification'].attrs['shortName'].decode() + # TODO test that this is the proper error + except KeyError: + raise 'Unable to parse the product name from file metadata' + return product @staticmethod def _check_source_for_pattern(source, filename_pattern): From 612662e3ffc9395bc90557c4fdaba0a88500b068 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 5 Sep 2023 17:45:54 +0000 Subject: [PATCH 13/30] clean up remainder of file and remove extraneous comments --- icepyx/core/read.py | 137 +++++++++++++++++++++++++++----------------- 1 file changed, 83 insertions(+), 54 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index c15957210..c8fe4f276 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -300,69 +300,83 @@ class Read: def __init__( self, - path, # TODO how to deal with the fact that this is required in later versions - # but does not exist in past versions? - out_obj_type=None, # xr.Dataset, + path=None, product=None, data_source=None, filename_pattern="ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5", + out_obj_type=None, # xr.Dataset, ): # Raise warnings for depreciated arguments if data_source: - warnings.warn('The `data_source` argument is depreciated. 
Please use the path argument instead.') - # TODO this check doesn't work because default isn't None - if filename_pattern: - warnings.warn('The `filename_pattern` argument is depreciated. Instead please provide a glob string to the `path` argument') + warnings.warn( + 'The `data_source` argument is depreciated. Please use the path argument ' + 'instead.' + ) + if filename_pattern != "ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5": + warnings.warn( + 'The `filename_pattern` argument is depreciated. Instead please provide a ' + 'glob string to the `path` argument' + ) + if product: + product = is2ref._validate_product(product) + warnings.warn( + 'The `product` argument is no longer required. If the `path` argument given ' + 'contains files with multiple products the `product` argument will be used ' + 'to filter that list. In all other cases the product argument is ignored. ' + 'The recommended approach is to not include a `product` argument and instead ' + 'provide a `path` with files of only a single product type`.' + ) - # CREATE THE FILELIST # Create the filelist from the user `path` argument if isinstance(path, list): self._filelist = path - # Discussion: I think actually this parameter type will only exist for cloud? - # Unless we really want to abstract more stuff, i.e. the downloading - # elif isinstance(path, Query): - # self._filelist = path. elif os.path.isdir(path): path = os.path.join(path, '*') - # TODO better flow so ths glob doesn't happen twice self._filelist = glob.glob(path) else: - # Discussion: should we default to recursive or not? - # Could allow for glob kwargs, but at that point I think we should just tell - # the user to run glob themself to create the filelist. 
self._filelist = glob.glob(path) + # Remove any directories from the list + self._filelist = [f for f in self._filelist if not os.path.isdir(f)] - # EXTRACT THE PRODUCT FOR EACH FILE - # Note for ticket: this logic got a little complex in the attempt to maintain a - # user-given product argument. If this gets depreciated we could depricate this - # Create a dictionary of the metadata extracted + # Create a dictionary of the products as read from the metadata product_dict = {} for file_ in self._filelist: product_dict[file_] = self._extract_product(file_) - # DEAL WITH MULTIPLE PRODUCTS IN THE LIST - # raise warning if there are multiple products present - if len(set(product_dict.values())) > 1: - # filter to only one product + + # Raise warnings or errors for muliple products or products not matching the user-specified product + all_products = list(set(product_dict.values())) + if len(all_products) > 1: if product: - warnings.warn(f'Multiple products found in list of files: {product_dict}. Files that do not match the user specified product will be removed from processing.') - # TODO thoughts on making filelist public read-only? It seems fair as I write - # all these warnings/error messages that reference a filelist. + warnings.warn( + f'Multiple products found in list of files: {product_dict}. Files that ' + 'do not match the user specified product will be removed from processing.' + ) self._filelist = [] for key, value in product_dict.items(): if value == product: self._filelist.append(key) - product_dict.pop(key) if len(self._filelist) == 0: - raise 'No files found in the file list matching the user-specified product type' + raise TypeError( + 'No files found in the file list matching the user-specified ' + 'product type' + ) + # Use the cleaned filelist to assign a product + self._product = product else: - raise TypeError(f'Multiple product types were found in the file list: {product_dict}. 
Please provide a valid `path` parameter indicating files of a single product') - # ASSIGN A PRODUCT TO THIS FILELIST - self.product = list(product_dict.values())[0] - if product and self.product != product: - warnings.warn(f'User specified product {product} does not match the product from the file metadata {self.product}') - - # Discussion: is this code meaningful to others? or can it be cleaned up? - # after validation, use the notebook code and code outline to start implementing the rest of the class + raise TypeError( + f'Multiple product types were found in the file list: {product_dict}.' + 'Please provide a valid `path` parameter indicating files of a single ' + 'product' + ) + else: + # Assign the identified product to the property + self._product = all_products[0] + # Raise a warning if the metadata-located product differs from the user-specified product + if product and self._product != product: + warnings.warn( + f'User specified product {product} does not match the product from the file' + ' metadata {self._product}' + ) if out_obj_type is not None: print( @@ -370,9 +384,6 @@ def __init__( "no other output types are implemented yet" ) self._out_obj = xr.Dataset - - print('filelist:', self._filelist) - print('product', self.product) # ---------------------------------------------------------------------- # Properties @@ -398,18 +409,45 @@ def vars(self): if not hasattr(self, "_read_vars"): self._read_vars = Variables( - "file", path=self._filelist[0], product=self._prod + "file", path=self.filelist[0], product=self.product ) return self._read_vars + + @property + def filelist(self): + """ + A read-only property for the user to view the list of files represented by this + Read object. 
+ """ + return self._filelist + + @property + def num_files(self): + """ + Return the number of files that is being processed by the object + """ + return len(self.filelist) + + @property + def product(self): + """ + A read-only property for the user to view the product associated with the Read + object. + """ + return self._product # ---------------------------------------------------------------------- # Methods @staticmethod def _extract_product(filepath): + """ + Read the product type from the metadata of the file. Return the product as a string. + """ with h5py.File(filepath, 'r') as f: try: + # TODO consider: should we get this from the top level attrs instead? product = f['METADATA']['DatasetIdentification'].attrs['shortName'].decode() # TODO test that this is the proper error except KeyError: @@ -675,7 +713,7 @@ def load(self): # However, this led to errors when I tried to combine two identical datasets because the single dimension was equal. # In these situations, xarray recommends manually controlling the merge/concat process yourself. # While unlikely to be a broad issue, I've heard of multiple matching timestamps causing issues for combining multiple IS2 datasets. - for file in self._filelist: + for file in self.filelist: all_dss.append( self._build_single_file_dataset(file, groups_list) ) # wanted_groups, vgrp.keys())) @@ -710,7 +748,7 @@ def _build_dataset_template(self, file): gran_idx=[np.uint64(999999)], source_file=(["gran_idx"], [file]), ), - attrs=dict(data_product=self._prod), + attrs=dict(data_product=self.product), ) return is2ds @@ -754,20 +792,11 @@ def _build_single_file_dataset(self, file, groups_list): ------- Xarray Dataset """ - file_product = self._read_single_grp(file, "/").attrs["identifier_product_type"] - assert ( - file_product == self._prod - ), "Your product specification does not match the product specification within your files." - # I think the below method might NOT read the file into memory as the above might? 
- # import h5py - # with h5py.File(filepath,'r') as h5pt: - # prod_id = h5pt.attrs["identifier_product_type"] - # DEVNOTE: if and elif does not actually apply wanted variable list, and has not been tested for merging multiple files into one ds # if a gridded product # TODO: all products need to be tested, and quicklook products added or explicitly excluded # Level 3b, gridded (netcdf): ATL14, 15, 16, 17, 18, 19, 20, 21 - if self._prod in [ + if self.product in [ "ATL14", "ATL15", "ATL16", @@ -780,7 +809,7 @@ def _build_single_file_dataset(self, file, groups_list): is2ds = xr.open_dataset(file) # Level 3b, hdf5: ATL11 - elif self._prod in ["ATL11"]: + elif self.product in ["ATL11"]: is2ds = self._build_dataset_template(file) # returns the wanted groups as a single list of full group path strings From c16a00359034b5920780ce0f7719ea6c9000891d Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 5 Sep 2023 21:06:39 +0000 Subject: [PATCH 14/30] maintain backward compatibility and combine arguments --- icepyx/core/is2ref.py | 5 +++-- icepyx/core/read.py | 51 +++++++++++++++++++++++-------------------- 2 files changed, 30 insertions(+), 26 deletions(-) diff --git a/icepyx/core/is2ref.py b/icepyx/core/is2ref.py index 883772a9e..6003d91b8 100644 --- a/icepyx/core/is2ref.py +++ b/icepyx/core/is2ref.py @@ -15,6 +15,7 @@ def _validate_product(product): """ Confirm a valid ICESat-2 product was specified """ + error_msg = "A valid product string was not provided. Check user input, if given, or file metadata." 
if isinstance(product, str): product = str.upper(product) assert product in [ @@ -39,9 +40,9 @@ def _validate_product(product): "ATL19", "ATL20", "ATL21", - ], "Please enter a valid product" + ], error_msg else: - raise TypeError("Please enter a product string") + raise TypeError(error_msg) return product diff --git a/icepyx/core/read.py b/icepyx/core/read.py index c8fe4f276..c900ed6c4 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -297,26 +297,23 @@ class Read: # ---------------------------------------------------------------------- # Constructors - + + # TODO -- update docstring + def __init__( self, - path=None, + data_source, product=None, - data_source=None, - filename_pattern="ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5", + filename_pattern=None, out_obj_type=None, # xr.Dataset, ): # Raise warnings for depreciated arguments - if data_source: - warnings.warn( - 'The `data_source` argument is depreciated. Please use the path argument ' - 'instead.' - ) - if filename_pattern != "ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5": + if filename_pattern: warnings.warn( 'The `filename_pattern` argument is depreciated. Instead please provide a ' - 'glob string to the `path` argument' + 'string, list, or glob string to the `data_source` argument.' ) + if product: product = is2ref._validate_product(product) warnings.warn( @@ -327,14 +324,21 @@ def __init__( 'provide a `path` with files of only a single product type`.' 
) - # Create the filelist from the user `path` argument - if isinstance(path, list): - self._filelist = path - elif os.path.isdir(path): - path = os.path.join(path, '*') - self._filelist = glob.glob(path) + # Create the filelist from the `data_source` argument + if filename_pattern: + # maintained for backward compatibility + pattern_ck, filelist = Read._check_source_for_pattern( + data_source, filename_pattern + ) + assert pattern_ck + self._filelist = filelist + elif isinstance(data_source, list): + self._filelist = data_source + elif os.path.isdir(data_source): + data_source = os.path.join(data_source, '*') + self._filelist = glob.glob(data_source) else: - self._filelist = glob.glob(path) + self._filelist = glob.glob(data_source) # Remove any directories from the list self._filelist = [f for f in self._filelist if not os.path.isdir(f)] @@ -342,7 +346,7 @@ def __init__( product_dict = {} for file_ in self._filelist: product_dict[file_] = self._extract_product(file_) - + # Raise warnings or errors for muliple products or products not matching the user-specified product all_products = list(set(product_dict.values())) if len(all_products) > 1: @@ -417,23 +421,21 @@ def vars(self): @property def filelist(self): """ - A read-only property for the user to view the list of files represented by this - Read object. + A read-only property for viewing the list of files represented by this Read object. """ return self._filelist @property def num_files(self): """ - Return the number of files that is being processed by the object + Return the number of files that are being processed """ return len(self.filelist) @property def product(self): """ - A read-only property for the user to view the product associated with the Read - object. + A read-only property for the user to view the product associated with the Read object. """ return self._product @@ -449,6 +451,7 @@ def _extract_product(filepath): try: # TODO consider: should we get this from the top level attrs instead? 
product = f['METADATA']['DatasetIdentification'].attrs['shortName'].decode() + product = is2ref._validate_product(product) # TODO test that this is the proper error except KeyError: raise 'Unable to parse the product name from file metadata' From 76480783444165519b66590b31e99248b27ad35b Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 5 Sep 2023 22:15:31 +0000 Subject: [PATCH 15/30] update to new error message --- icepyx/tests/test_is2ref.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/icepyx/tests/test_is2ref.py b/icepyx/tests/test_is2ref.py index c2ddf6e5e..7d1bba7bf 100644 --- a/icepyx/tests/test_is2ref.py +++ b/icepyx/tests/test_is2ref.py @@ -8,14 +8,14 @@ def test_num_product(): dsnum = 6 - ermsg = "Please enter a product string" + ermsg = "A valid product string was not provided. Check user input, if given, or file metadata." with pytest.raises(TypeError, match=ermsg): is2ref._validate_product(dsnum) def test_bad_product(): wrngds = "atl-6" - ermsg = "Please enter a valid product" + ermsg = "A valid product string was not provided. Check user input, if given, or file metadata." 
with pytest.raises(AssertionError, match=ermsg): is2ref._validate_product(wrngds) From 4cfbfdbd7cda2701ab3036cd381cd16f7f889c6c Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Fri, 8 Sep 2023 14:16:25 +0000 Subject: [PATCH 16/30] update docs --- .../example_notebooks/IS2_data_read-in.ipynb | 180 +++++++++++++----- doc/source/user_guide/documentation/read.rst | 3 + icepyx/core/read.py | 44 +++-- 3 files changed, 165 insertions(+), 62 deletions(-) diff --git a/doc/source/example_notebooks/IS2_data_read-in.ipynb b/doc/source/example_notebooks/IS2_data_read-in.ipynb index 115c63044..9288e7da3 100644 --- a/doc/source/example_notebooks/IS2_data_read-in.ipynb +++ b/doc/source/example_notebooks/IS2_data_read-in.ipynb @@ -63,9 +63,8 @@ "metadata": {}, "outputs": [], "source": [ - "path_root = '/full/path/to/your/data/'\n", - "pattern = \"processed_ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5\"\n", - "reader = ipx.Read(path_root, \"ATL06\", pattern) # or ipx.Read(filepath, \"ATLXX\") if your filenames match the default pattern" + "path_root = '/full/path/to/your/ATL06_data/'\n", + "reader = ipx.Read(path_root)" ] }, { @@ -111,10 +110,9 @@ "\n", "Reading in ICESat-2 data with icepyx happens in a few simple steps:\n", "1. Let icepyx know where to find your data (this might be local files or urls to data in cloud storage)\n", - "2. Tell icepyx how to interpret the filename format\n", - "3. Create an icepyx `Read` object\n", - "4. Make a list of the variables you want to read in (does not apply for gridded products)\n", - "5. Load your data into memory (or read it in lazily, if you're using Dask)\n", + "2. Create an icepyx `Read` object\n", + "3. Make a list of the variables you want to read in (does not apply for gridded products)\n", + "4. Load your data into memory (or read it in lazily, if you're using Dask)\n", "\n", "We go through each of these steps in more detail in this notebook." 
] @@ -168,17 +166,18 @@ { "cell_type": "markdown", "id": "e8da42c1", - "metadata": {}, + "metadata": { + "user_expressions": [] + }, "source": [ "### Step 1: Set data source path\n", "\n", "Provide a full path to the data to be read in (i.e. opened).\n", "Currently accepted inputs are:\n", - "* a directory\n", - "* a single file\n", - "\n", - "All files to be read in *must* have a consistent filename pattern.\n", - "If a directory is supplied as the data source, all files in any subdirectories that match the filename pattern will be included.\n", + "* a string path to directory - all files from the directory will be opened\n", + "* a string path to single file - one file will be opened\n", + "* a list of filepaths - all files in the list will be opened\n", + "* a glob string (see [glob](https://docs.python.org/3/library/glob.html)) - any files matching the glob pattern will be opened\n", "\n", "S3 bucket data access is currently under development, and requires you are registered with NSIDC as a beta tester for cloud-based ICESat-2 data.\n", "icepyx is working to ensure a smooth transition to working with remote files.\n", @@ -205,6 +204,17 @@ "# filepath = path_root + 'ATL06-20181214041627-Sample.h5'" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "fac636c2-e0eb-4e08-adaa-8f47623e46a1", + "metadata": {}, + "outputs": [], + "source": [ + "# list_of_files = ['/my/data/ATL06/processed_ATL06_20190226005526_09100205_006_02.h5', \n", + "# '/my/other/data/ATL06/processed_ATL06_20191202102922_10160505_006_01.h5']" + ] + }, { "cell_type": "code", "execution_count": null, @@ -217,77 +227,123 @@ }, { "cell_type": "markdown", - "id": "92743496", + "id": "ba3ebeb0-3091-4712-b0f7-559ddb95ca5a", "metadata": { "user_expressions": [] }, "source": [ - "### Step 2: Create a filename pattern for your data files\n", + "#### Glob Strings\n", + "\n", + "[glob](https://docs.python.org/3/library/glob.html) is a Python library which allows users to list files in their 
file systems whose paths match a given pattern. Icepyx uses the glob library to give users greater flexibility over their input file lists.\n", "\n", - "Files provided by NSIDC typically match the format `\"ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5\"` where the parameters in curly brackets indicate a parameter name (left of the colon) and character length or format (right of the colon).\n", - "Some of this information is used during data opening to help correctly read and label the data within the data structure, particularly when multiple files are opened simultaneously.\n", + "glob works using `*` and `?` as wildcard characters, where `*` matches any number of characters and `?` matches a single character. For example:\n", "\n", - "By default, icepyx will assume your filenames follow the default format.\n", - "However, you can easily read in other ICESat-2 data files by supplying your own filename pattern.\n", - "For instance, `pattern=\"ATL{product:2}-{datetime:%Y%m%d%H%M%S}-Sample.h5\"`. A few example patterns are provided below." + "* `/this/path/*.h5`: refers to all files `.h5` files in the `/this/path` folder\n", + "* `ATL??.h5`: refers to any `.h5` file that starts with `ATL` and then has any 2 characters after it\n", + "* `/this/path/ATL??/*.h5`: refers to all `.h5` files that are in a subfolder of `/this/path` which has a filename of `ATL` followed by any 2 characters\n", + "\n", + "See the glob documentation or other online explainer tutorials for more in depth explanation, or advanced glob paths such as character classes and ranges." 
] }, { - "cell_type": "code", - "execution_count": null, - "id": "7318abd0", - "metadata": {}, - "outputs": [], + "cell_type": "markdown", + "id": "20286c76-5632-4420-b2c9-a5a6b1952672", + "metadata": { + "user_expressions": [] + }, "source": [ - "# pattern = 'ATL06-{datetime:%Y%m%d%H%M%S}-Sample.h5'\n", - "# pattern = 'ATL{product:2}-{datetime:%Y%m%d%H%M%S}-Sample.h5'" + "#### Recursive Directory Search" + ] + }, + { + "cell_type": "markdown", + "id": "632bd1ce-2397-4707-a63f-9d5d2fc02fbc", + "metadata": { + "user_expressions": [] + }, + "source": [ + "If specifying a directory, glob will not by default search all of the subdirectories for matching filepaths. If this is the search method you would like, you can achieve this by either:\n", + "1. passing the `recursive` argument into `glob_kwargs`\n", + "2. using glob directly to create a list of filepaths" + ] + }, + { + "cell_type": "markdown", + "id": "da0cacd8-9ddc-4c31-86b6-167d850b989e", + "metadata": { + "user_expressions": [] + }, + "source": [ + "Method 1: passing the `recursive` argument into `glob_kwargs`" ] }, { "cell_type": "code", "execution_count": null, - "id": "f43e8664", + "id": "be79b0dd-efcf-4d50-bdb0-8e3ae8e8e38c", "metadata": {}, "outputs": [], "source": [ - "# pattern = \"ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5\"" + "import glob" ] }, { "cell_type": "code", "execution_count": null, - "id": "992a77fb", - "metadata": {}, + "id": "5d088571-496d-479a-9fb7-833ed7e98676", + "metadata": { + "tags": [] + }, "outputs": [], "source": [ - "# grid_pattern = \"ATL{product:2}_GL_0311_{res:3}m_{version:3}_{revision:2}.nc\"" + "list_of_files = glob.glob('/path/to/my/folder', recursive=True)\n", + "ipx.Read(list_of_files)" + ] + }, + { + "cell_type": "markdown", + "id": "76de9539-710c-49f6-9e9e-238849382c33", + "metadata": { + "user_expressions": [] + }, + "source": [ + "Method 2: using glob directly to create a list of filepaths" ] }, { "cell_type": 
"code", "execution_count": null, - "id": "6aec1a70", + "id": "e276b876-9ec7-4991-8520-05c97824b896", "metadata": {}, "outputs": [], "source": [ - "pattern = \"processed_ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5\"" + "ipx.Read('/path/to/my/folder', glob_kwargs={'recursive': True})" ] }, { "cell_type": "markdown", - "id": "4275b04c", + "id": "08df2874-7c54-4670-8f37-9135ea296ff5", "metadata": { "user_expressions": [] }, "source": [ - "### Step 3: Create an icepyx read object\n", + "```{admonition} Read Module Update\n", + "Previously, icepyx required two additional things: 1) that you specify a `product` and 2) that your files either matched the default `filename_pattern` or that the user provided their own `filename_pattern`. These two requirements have been removed. `product` is not read directly from the file metadata (the root group's `short_name` attribute). Flexibility to specify multiple files via the `filename_pattern` has been replaced with [glob string](https://docs.python.org/3/library/glob.html) and allowing a list of filepaths as an argument.\n", "\n", - "The `Read` object has two required inputs:\n", - "- `path` = a string with the full file path or full directory path to your hdf5 (.h5) format files.\n", - "- `product` = the data product you're working with, also known as the \"short name\".\n", + "These arguments have been maintained for backward compatibility, but will be fully removed in icepyx version 1.0.0.\n", + "```" + ] + }, + { + "cell_type": "markdown", + "id": "4275b04c", + "metadata": { + "user_expressions": [] + }, + "source": [ + "### Step 2: Create an icepyx read object\n", "\n", - "The `Read` object also accepts the optional keyword input:\n", - "- `pattern` = a formatted string indicating the filename pattern required for Intake's path_as_pattern argument." + "Using the `data_source` described in Step 1, we can create our Read object." 
] }, { @@ -299,7 +355,17 @@ }, "outputs": [], "source": [ - "reader = ipx.Read(data_source=path_root, product=\"ATL06\", filename_pattern=pattern) # or ipx.Read(filepath, \"ATLXX\") if your filenames match the default pattern" + "reader = ipx.Read(data_source=path_root)" + ] + }, + { + "cell_type": "markdown", + "id": "7b2acfdb-75eb-4c64-b583-2ab19326aaee", + "metadata": { + "user_expressions": [] + }, + "source": [ + "The Read object now contains the list of matching files that will eventually be loaded into Python. You can inspect its properties, such as the files that were located or the identified product, directly on the Read object." ] }, { @@ -309,7 +375,27 @@ "metadata": {}, "outputs": [], "source": [ - "reader._filelist" + "reader.filelist" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "248590ba-b468-4ca5-999f-4323b704008e", + "metadata": {}, + "outputs": [], + "source": [ + "reader.num_files" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7455ee3f-f9ab-486e-b4c7-2fa2314d4084", + "metadata": {}, + "outputs": [], + "source": [ + "reader.product" ] }, { @@ -319,7 +405,7 @@ "user_expressions": [] }, "source": [ - "### Step 4: Specify variables to be read in\n", + "### Step 3: Specify variables to be read in\n", "\n", "To load your data into memory or prepare it for analysis, icepyx needs to know which variables you'd like to read in.\n", "If you've used icepyx to download data from NSIDC with variable subsetting (which is the default), then you may already be familiar with the icepyx `Variables` module and how to create and modify lists of variables.\n", @@ -426,7 +512,7 @@ "user_expressions": [] }, "source": [ - "### Step 5: Loading your data\n", + "### Step 4: Loading your data\n", "\n", "Now that you've set up all the options, you're ready to read your ICESat-2 data into memory!" 
] @@ -541,9 +627,9 @@ ], "metadata": { "kernelspec": { - "display_name": "general", + "display_name": "icepyx-dev", "language": "python", - "name": "general" + "name": "icepyx-dev" }, "language_info": { "codemirror_mode": { diff --git a/doc/source/user_guide/documentation/read.rst b/doc/source/user_guide/documentation/read.rst index a5beedf4e..892f98087 100644 --- a/doc/source/user_guide/documentation/read.rst +++ b/doc/source/user_guide/documentation/read.rst @@ -19,6 +19,9 @@ Attributes .. autosummary:: :toctree: ../../_icepyx/ + Read.filelist + Read.num_files + Read.product Read.vars diff --git a/icepyx/core/read.py b/icepyx/core/read.py index c900ed6c4..90bc6be9d 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -8,12 +8,9 @@ import xarray as xr import icepyx.core.is2ref as is2ref -from icepyx.core.query import Query from icepyx.core.variables import Variables as Variables from icepyx.core.variables import list_of_dict_vals -# from icepyx.core.query import Query - def _make_np_datetime(df, keyword): """ @@ -267,19 +264,19 @@ class Read: Parameters ---------- - data_source : string - A string with a full file path or full directory path to ICESat-2 hdf5 (.h5) format files. - Files within a directory must have a consistent filename pattern that includes the "ATL??" data product name. - Files must all be within a single directory. + data_source : string, List + A string or list which specifies the files to be read. The string can be either: 1) the path of a single file 2) the path to a directory or 3) a [glob string](https://docs.python.org/3/library/glob.html). product : string ICESat-2 data product ID, also known as "short name" (e.g. ATL03). Available data products can be found at: https://nsidc.org/data/icesat-2/data-sets + **Depreciation warning:** This argument is no longer required and will be depreciated in version 1.0.0. The dataset product is read from the file metadata. 
filename_pattern : string, default 'ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5' String that shows the filename pattern as required for Intake's path_as_pattern argument. The default describes files downloaded directly from NSIDC (subsetted and non-subsetted) for most products (e.g. ATL06). The ATL11 filename pattern from NSIDC is: 'ATL{product:2}_{rgt:4}{orbitsegment:2}_{cycles:4}_{version:3}_{revision:2}.h5'. + **Depreciation warning:** This argument is no longer required and will be depreciated in version 1.0.0. out_obj_type : object, default xarray.Dataset The desired format for the data to be read in. @@ -292,13 +289,31 @@ class Read: Examples -------- + Reading a single file + ``` + ipx.Read('/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5') # doctest: +SKIP + ``` + Reading all files in a directory + ``` + ipx.Read('/path/to/data/') # doctest: +SKIP + ``` + Reading files that match a particular pattern (here, all .h5 files that start with `processed_ATL06_`). + ``` + ipx.Read('/path/to/data/processed_ATL06_*.h5') # doctest: +SKIP + ``` + Reading a specific list of files + ``` + list_of_files = ['/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5', + '/path/to/more/data/processed_ATL06_20191202102922_10160505_006_01.h5'] + ipx.Read(list_of_files) # doctest: +SKIP + ``` """ # ---------------------------------------------------------------------- # Constructors - # TODO -- update docstring + # TODO -- what if user passes an empty list, or the glob string returns empty def __init__( self, @@ -317,11 +332,11 @@ def __init__( if product: product = is2ref._validate_product(product) warnings.warn( - 'The `product` argument is no longer required. If the `path` argument given ' + 'The `product` argument is no longer required. If the `data_source` argument given ' 'contains files with multiple products the `product` argument will be used ' 'to filter that list. 
In all other cases the product argument is ignored. ' 'The recommended approach is to not include a `product` argument and instead ' - 'provide a `path` with files of only a single product type`.' + 'provide a `data_source` with files of only a single product type`.' ) # Create the filelist from the `data_source` argument @@ -369,7 +384,7 @@ def __init__( else: raise TypeError( f'Multiple product types were found in the file list: {product_dict}.' - 'Please provide a valid `path` parameter indicating files of a single ' + 'Please provide a valid `data_source` parameter indicating files of a single ' 'product' ) else: @@ -448,15 +463,14 @@ def _extract_product(filepath): Read the product type from the metadata of the file. Return the product as a string. """ with h5py.File(filepath, 'r') as f: - try: - # TODO consider: should we get this from the top level attrs instead? - product = f['METADATA']['DatasetIdentification'].attrs['shortName'].decode() + try: + product = f.attrs['short_name'].decode() product = is2ref._validate_product(product) # TODO test that this is the proper error except KeyError: raise 'Unable to parse the product name from file metadata' return product - + @staticmethod def _check_source_for_pattern(source, filename_pattern): """ From f7f823b40674fee5e83329d34518403ae285a81f Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Fri, 8 Sep 2023 14:32:45 +0000 Subject: [PATCH 17/30] glob kwargs and list error --- icepyx/core/read.py | 14 ++++++++++---- 1 file changed, 10 insertions(+), 4 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index 90bc6be9d..9176e6cc4 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -277,6 +277,8 @@ class Read: The default describes files downloaded directly from NSIDC (subsetted and non-subsetted) for most products (e.g. ATL06). The ATL11 filename pattern from NSIDC is: 'ATL{product:2}_{rgt:4}{orbitsegment:2}_{cycles:4}_{version:3}_{revision:2}.h5'. 
**Depreciation warning:** This argument is no longer required and will be depreciated in version 1.0.0. + glob_kwargs : dict, default {} + Additional arguments to be passed into the [glob.glob()](https://docs.python.org/3/library/glob.html#glob.glob)function out_obj_type : object, default xarray.Dataset The desired format for the data to be read in. @@ -313,13 +315,12 @@ class Read: # ---------------------------------------------------------------------- # Constructors - # TODO -- what if user passes an empty list, or the glob string returns empty - def __init__( self, data_source, product=None, filename_pattern=None, + glob_kwargs = {}, out_obj_type=None, # xr.Dataset, ): # Raise warnings for depreciated arguments @@ -351,9 +352,9 @@ def __init__( self._filelist = data_source elif os.path.isdir(data_source): data_source = os.path.join(data_source, '*') - self._filelist = glob.glob(data_source) + self._filelist = glob.glob(data_source, **glob_kwargs) else: - self._filelist = glob.glob(data_source) + self._filelist = glob.glob(data_source, **glob_kwargs) # Remove any directories from the list self._filelist = [f for f in self._filelist if not os.path.isdir(f)] @@ -387,6 +388,11 @@ def __init__( 'Please provide a valid `data_source` parameter indicating files of a single ' 'product' ) + elif len(all_products) == 0: + raise TypeError( + 'No files found matching the specified `data_source`. Check your glob ' + 'string or file list.' 
+ ) else: # Assign the identified product to the property self._product = all_products[0] From 203f3adafc085bce44d0fd993b5932f60366f33c Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Fri, 8 Sep 2023 14:44:22 +0000 Subject: [PATCH 18/30] formatting updates --- .../example_notebooks/IS2_data_read-in.ipynb | 42 ++++++++++--------- icepyx/core/read.py | 18 ++++---- 2 files changed, 33 insertions(+), 27 deletions(-) diff --git a/doc/source/example_notebooks/IS2_data_read-in.ipynb b/doc/source/example_notebooks/IS2_data_read-in.ipynb index 9288e7da3..0ab4a4dfa 100644 --- a/doc/source/example_notebooks/IS2_data_read-in.ipynb +++ b/doc/source/example_notebooks/IS2_data_read-in.ipynb @@ -262,7 +262,9 @@ "user_expressions": [] }, "source": [ - "If specifying a directory, glob will not by default search all of the subdirectories for matching filepaths. If this is the search method you would like, you can achieve this by either:\n", + "glob will not by default search all of the subdirectories for matching filepaths, but it has the ability to do so. To search recursively you need to 1) use `/**/` in the filepath to match any level of nested folders and 2) use the `recursive=True` argument. \n", + "\n", + "If you would like to search recursively, you can achieve this by either:\n", "1. passing the `recursive` argument into `glob_kwargs`\n", "2. 
using glob directly to create a list of filepaths" ] @@ -280,24 +282,11 @@ { "cell_type": "code", "execution_count": null, - "id": "be79b0dd-efcf-4d50-bdb0-8e3ae8e8e38c", + "id": "e276b876-9ec7-4991-8520-05c97824b896", "metadata": {}, "outputs": [], "source": [ - "import glob" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "5d088571-496d-479a-9fb7-833ed7e98676", - "metadata": { - "tags": [] - }, - "outputs": [], - "source": [ - "list_of_files = glob.glob('/path/to/my/folder', recursive=True)\n", - "ipx.Read(list_of_files)" + "ipx.Read('/path/to/**/folder', glob_kwargs={'recursive': True})" ] }, { @@ -313,11 +302,24 @@ { "cell_type": "code", "execution_count": null, - "id": "e276b876-9ec7-4991-8520-05c97824b896", + "id": "be79b0dd-efcf-4d50-bdb0-8e3ae8e8e38c", "metadata": {}, "outputs": [], "source": [ - "ipx.Read('/path/to/my/folder', glob_kwargs={'recursive': True})" + "import glob" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5d088571-496d-479a-9fb7-833ed7e98676", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "list_of_files = glob.glob('/path/to/**/folder', recursive=True)\n", + "ipx.Read(list_of_files)" ] }, { @@ -328,9 +330,9 @@ }, "source": [ "```{admonition} Read Module Update\n", - "Previously, icepyx required two additional things: 1) that you specify a `product` and 2) that your files either matched the default `filename_pattern` or that the user provided their own `filename_pattern`. These two requirements have been removed. `product` is not read directly from the file metadata (the root group's `short_name` attribute). 
Flexibility to specify multiple files via the `filename_pattern` has been replaced with [glob string](https://docs.python.org/3/library/glob.html) and allowing a list of filepaths as an argument.\n", + "Previously, icepyx required two additional conditions: 1) a `product` argument and 2) that your files either matched the default `filename_pattern` or that the user provided their own `filename_pattern`. These two requirements have been removed. `product` is now read directly from the file metadata (the root group's `short_name` attribute). Flexibility to specify multiple files via the `filename_pattern` has been replaced with the [glob string](https://docs.python.org/3/library/glob.html) feature, and by allowing a list of filepaths as an argument.\n", "\n", - "These arguments have been maintained for backward compatibility, but will be fully removed in icepyx version 1.0.0.\n", + "The `product` and `filename_pattern` arguments have been maintained for backwards compatibility, but will be fully removed in icepyx version 1.0.0.\n", "```" ] }, diff --git a/icepyx/core/read.py b/icepyx/core/read.py index 9176e6cc4..f5cb53f8f 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -327,7 +327,8 @@ def __init__( if filename_pattern: warnings.warn( 'The `filename_pattern` argument is depreciated. Instead please provide a ' - 'string, list, or glob string to the `data_source` argument.' + 'string, list, or glob string to the `data_source` argument.', + stacklevel=2, ) if product: @@ -337,7 +338,8 @@ def __init__( 'contains files with multiple products the `product` argument will be used ' 'to filter that list. In all other cases the product argument is ignored. ' 'The recommended approach is to not include a `product` argument and instead ' - 'provide a `data_source` with files of only a single product type`.' 
+ 'provide a `data_source` with files of only a single product type`.', + stacklevel=2, ) # Create the filelist from the `data_source` argument @@ -369,7 +371,8 @@ def __init__( if product: warnings.warn( f'Multiple products found in list of files: {product_dict}. Files that ' - 'do not match the user specified product will be removed from processing.' + 'do not match the user specified product will be removed from processing.', + stacklevel=2, ) self._filelist = [] for key, value in product_dict.items(): @@ -400,7 +403,8 @@ def __init__( if product and self._product != product: warnings.warn( f'User specified product {product} does not match the product from the file' - ' metadata {self._product}' + ' metadata {self._product}', + stacklevel=2, ) if out_obj_type is not None: @@ -442,21 +446,21 @@ def vars(self): @property def filelist(self): """ - A read-only property for viewing the list of files represented by this Read object. + Return the list of files represented by this Read object. """ return self._filelist @property def num_files(self): """ - Return the number of files that are being processed + Return the number of files that are being processed. """ return len(self.filelist) @property def product(self): """ - A read-only property for the user to view the product associated with the Read object. + Return the product associated with the Read object. 
""" return self._product From 10d15910a1f82ec2b18ba61eff647e243d44651c Mon Sep 17 00:00:00 2001 From: Rachel Wegener <35503632+rwegener2@users.noreply.github.com> Date: Tue, 12 Sep 2023 09:18:22 -0400 Subject: [PATCH 19/30] Apply suggestions from code review Co-authored-by: Jessica Scheick --- icepyx/core/read.py | 27 +++++++++++---------------- 1 file changed, 11 insertions(+), 16 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index f5cb53f8f..c45a72fa9 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -272,8 +272,8 @@ class Read: Available data products can be found at: https://nsidc.org/data/icesat-2/data-sets **Depreciation warning:** This argument is no longer required and will be depreciated in version 1.0.0. The dataset product is read from the file metadata. - filename_pattern : string, default 'ATL{product:2}_{datetime:%Y%m%d%H%M%S}_{rgt:4}{cycle:2}{orbitsegment:2}_{version:3}_{revision:2}.h5' - String that shows the filename pattern as required for Intake's path_as_pattern argument. + filename_pattern : string, default None + String that shows the filename pattern as previously required for Intake's path_as_pattern argument. The default describes files downloaded directly from NSIDC (subsetted and non-subsetted) for most products (e.g. ATL06). The ATL11 filename pattern from NSIDC is: 'ATL{product:2}_{rgt:4}{orbitsegment:2}_{cycles:4}_{version:3}_{revision:2}.h5'. **Depreciation warning:** This argument is no longer required and will be depreciated in version 1.0.0. 
@@ -292,23 +292,18 @@ class Read: Examples -------- Reading a single file - ``` - ipx.Read('/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5') # doctest: +SKIP - ``` + >>> ipx.Read('/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5') # doctest: +SKIP + Reading all files in a directory - ``` - ipx.Read('/path/to/data/') # doctest: +SKIP - ``` + >>> ipx.Read('/path/to/data/') # doctest: +SKIP + Reading files that match a particular pattern (here, all .h5 files that start with `processed_ATL06_`). - ``` - ipx.Read('/path/to/data/processed_ATL06_*.h5') # doctest: +SKIP - ``` + >>> ipx.Read('/path/to/data/processed_ATL06_*.h5') # doctest: +SKIP + Reading a specific list of files - ``` - list_of_files = ['/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5', + >>> list_of_files = ['/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5', '/path/to/more/data/processed_ATL06_20191202102922_10160505_006_01.h5'] - ipx.Read(list_of_files) # doctest: +SKIP - ``` + >>> ipx.Read(list_of_files) # doctest: +SKIP """ @@ -326,7 +321,7 @@ def __init__( # Raise warnings for depreciated arguments if filename_pattern: warnings.warn( - 'The `filename_pattern` argument is depreciated. Instead please provide a ' + 'The `filename_pattern` argument is deprecated. 
Instead please provide a ' 'string, list, or glob string to the `data_source` argument.', stacklevel=2, ) From 0b23d1e12808fb69afa85d1fa5168c17221f52f2 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 12 Sep 2023 13:24:45 +0000 Subject: [PATCH 20/30] remove num_files --- doc/source/user_guide/documentation/read.rst | 1 - icepyx/core/read.py | 7 ------- 2 files changed, 8 deletions(-) diff --git a/doc/source/user_guide/documentation/read.rst b/doc/source/user_guide/documentation/read.rst index 892f98087..68da03b1d 100644 --- a/doc/source/user_guide/documentation/read.rst +++ b/doc/source/user_guide/documentation/read.rst @@ -20,7 +20,6 @@ Attributes :toctree: ../../_icepyx/ Read.filelist - Read.num_files Read.product Read.vars diff --git a/icepyx/core/read.py b/icepyx/core/read.py index c45a72fa9..b139ca567 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -444,13 +444,6 @@ def filelist(self): Return the list of files represented by this Read object. """ return self._filelist - - @property - def num_files(self): - """ - Return the number of files that are being processed. 
- """ - return len(self.filelist) @property def product(self): From 6f5beadcb8bca332fbf9fbda79310e075bbd8af3 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 12 Sep 2023 13:28:03 +0000 Subject: [PATCH 21/30] fix docs test typo --- icepyx/core/read.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index b139ca567..4300cebbc 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -301,8 +301,10 @@ class Read: >>> ipx.Read('/path/to/data/processed_ATL06_*.h5') # doctest: +SKIP Reading a specific list of files - >>> list_of_files = ['/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5', - '/path/to/more/data/processed_ATL06_20191202102922_10160505_006_01.h5'] + >>> list_of_files = [ + '/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5', + '/path/to/more/data/processed_ATL06_20191202102922_10160505_006_01.h5', + ] >>> ipx.Read(list_of_files) # doctest: +SKIP """ From 035ee5ab1e33dc43a471c36286a59c036d0cb292 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 12 Sep 2023 13:37:15 +0000 Subject: [PATCH 22/30] trying again to fix the build --- icepyx/core/read.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index 4300cebbc..b9a6e672e 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -302,9 +302,9 @@ class Read: Reading a specific list of files >>> list_of_files = [ - '/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5', - '/path/to/more/data/processed_ATL06_20191202102922_10160505_006_01.h5', - ] + ... '/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5', + ... '/path/to/more/data/processed_ATL06_20191202102922_10160505_006_01.h5', + ... 
] >>> ipx.Read(list_of_files) # doctest: +SKIP """ From 903c351007bc7245bf4d107b48b1f38c67acf900 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 12 Sep 2023 13:48:27 +0000 Subject: [PATCH 23/30] add feedback to docs page --- .../example_notebooks/IS2_data_read-in.ipynb | 42 +++++++------------ 1 file changed, 14 insertions(+), 28 deletions(-) diff --git a/doc/source/example_notebooks/IS2_data_read-in.ipynb b/doc/source/example_notebooks/IS2_data_read-in.ipynb index 0ab4a4dfa..4cdd3bf5a 100644 --- a/doc/source/example_notebooks/IS2_data_read-in.ipynb +++ b/doc/source/example_notebooks/IS2_data_read-in.ipynb @@ -177,11 +177,7 @@ "* a string path to directory - all files from the directory will be opened\n", "* a string path to single file - one file will be opened\n", "* a list of filepaths - all files in the list will be opened\n", - "* a glob string (see [glob](https://docs.python.org/3/library/glob.html)) - any files matching the glob pattern will be opened\n", - "\n", - "S3 bucket data access is currently under development, and requires you are registered with NSIDC as a beta tester for cloud-based ICESat-2 data.\n", - "icepyx is working to ensure a smooth transition to working with remote files.\n", - "We'd love your help exploring and testing these features as they become available!" 
+ "* a glob string (see [glob](https://docs.python.org/3/library/glob.html)) - any files matching the glob pattern will be opened" ] }, { @@ -215,16 +211,6 @@ "# '/my/other/data/ATL06/processed_ATL06_20191202102922_10160505_006_01.h5']" ] }, - { - "cell_type": "code", - "execution_count": null, - "id": "e683ebf7", - "metadata": {}, - "outputs": [], - "source": [ - "# urlpath = 's3://nsidc-cumulus-prod-protected/ATLAS/ATL03/004/2019/11/30/ATL03_20191130221008_09930503_004_01.h5'" - ] - }, { "cell_type": "markdown", "id": "ba3ebeb0-3091-4712-b0f7-559ddb95ca5a", @@ -238,9 +224,9 @@ "\n", "glob works using `*` and `?` as wildcard characters, where `*` matches any number of characters and `?` matches a single character. For example:\n", "\n", - "* `/this/path/*.h5`: refers to all files `.h5` files in the `/this/path` folder\n", - "* `ATL??.h5`: refers to any `.h5` file that starts with `ATL` and then has any 2 characters after it\n", - "* `/this/path/ATL??/*.h5`: refers to all `.h5` files that are in a subfolder of `/this/path` which has a filename of `ATL` followed by any 2 characters\n", + "* `/this/path/*.h5`: refers to all `.h5` files in the `/this/path` folder (Example matches: \"/this/path/processed_ATL03_20191130221008_09930503_006_01.h5\" or \"/this/path/myfavoriteicesat-2file.h5\")\n", + "* `/this/path/*ATL07*.h5`: refers to all `.h5` files in the `/this/path` folder that have ATL07 in the filename. (Example matches: \"/this/path/ATL07-02_20221012220720_03391701_005_01.h5\" or \"/this/path/processed_ATL07.h5\")\n", + "* `/this/path/ATL??/*.h5`: refers to all `.h5` files that are in a subfolder of `/this/path` whose name is `ATL` followed by any 2 characters (Example matches: \"/this/path/ATL03/processed_ATL03_20191130221008_09930503_006_01.h5\", \"/this/path/ATL06/myfile.h5\")\n", "\n", "See the glob documentation or other online explainer tutorials for more in depth explanation, or advanced glob paths such as character classes and ranges."
] @@ -289,6 +275,16 @@ "ipx.Read('/path/to/**/folder', glob_kwargs={'recursive': True})" ] }, + { + "cell_type": "markdown", + "id": "f5a1e85e-fc4a-405f-9710-0cb61b827f2c", + "metadata": { + "user_expressions": [] + }, + "source": [ + "You can use `glob_kwargs` for any additional argument to Python's builtin `glob.glob` that you would like to pass in via icepyx." + ] + }, { "cell_type": "markdown", "id": "76de9539-710c-49f6-9e9e-238849382c33", @@ -380,16 +376,6 @@ "reader.filelist" ] }, - { - "cell_type": "code", - "execution_count": null, - "id": "248590ba-b468-4ca5-999f-4323b704008e", - "metadata": {}, - "outputs": [], - "source": [ - "reader.num_files" - ] - }, { "cell_type": "code", "execution_count": null, From 5e06de94da0c492b4b3cc94a5b4d834b0dc829a4 Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Thu, 14 Sep 2023 13:32:52 +0000 Subject: [PATCH 24/30] fix typo --- icepyx/core/read.py | 1 - 1 file changed, 1 deletion(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index baeba27f4..966df8d08 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -338,7 +338,6 @@ def __init__( if data_source is None: raise ValueError("data_source is a required arguemnt") - ) # Raise warnings for deprecated arguments if filename_pattern: From b2c273518bee22f8f1417d51cdaf3a39958bc56e Mon Sep 17 00:00:00 2001 From: Jessica Scheick Date: Mon, 9 Oct 2023 15:59:03 -0400 Subject: [PATCH 25/30] depreciate -> deprecate --- icepyx/core/read.py | 80 ++++++++++++++++++++++----------------------- 1 file changed, 40 insertions(+), 40 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index 966df8d08..e687511d1 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -272,18 +272,18 @@ class Read: product : string ICESat-2 data product ID, also known as "short name" (e.g. ATL03). 
Available data products can be found at: https://nsidc.org/data/icesat-2/data-sets - **Depreciation warning:** This argument is no longer required and will be depreciated in version 1.0.0. The dataset product is read from the file metadata. + **Deprecation warning:** This argument is no longer required and will be deprecated in version 1.0.0. The dataset product is read from the file metadata. filename_pattern : string, default None String that shows the filename pattern as previously required for Intake's path_as_pattern argument. The default describes files downloaded directly from NSIDC (subsetted and non-subsetted) for most products (e.g. ATL06). The ATL11 filename pattern from NSIDC is: 'ATL{product:2}_{rgt:4}{orbitsegment:2}_{cycles:4}_{version:3}_{revision:2}.h5'. - **Depreciation warning:** This argument is no longer required and will be depreciated in version 1.0.0. - + **Deprecation warning:** This argument is no longer required and will be deprecated in version 1.0.0. + catalog : string, default None Full path to an Intake catalog for reading in data. If you still need to create a catalog, leave as default. - **Deprecation warning:** This argument has been depreciated. Please use the data_source argument to pass in valid data. + **Deprecation warning:** This argument has been deprecated. Please use the data_source argument to pass in valid data. glob_kwargs : dict, default {} Additional arguments to be passed into the [glob.glob()](https://docs.python.org/3/library/glob.html#glob.glob)function @@ -310,7 +310,7 @@ class Read: Reading a specific list of files >>> list_of_files = [ - ... '/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5', + ... '/path/to/data/processed_ATL06_20190226005526_09100205_006_02.h5', ... '/path/to/more/data/processed_ATL06_20191202102922_10160505_006_01.h5', ... 
] >>> ipx.Read(list_of_files) # doctest: +SKIP @@ -319,42 +319,42 @@ class Read: # ---------------------------------------------------------------------- # Constructors - + def __init__( self, data_source=None, # DevNote: Make this a required arg when catalog is removed product=None, filename_pattern=None, catalog=None, - glob_kwargs = {}, + glob_kwargs={}, out_obj_type=None, # xr.Dataset, ): # Raise error for deprecated argument if catalog: raise DeprecationError( - 'The `catalog` argument has been deprecated and intake is no longer supported. ' - 'Please use the `data_source` argument to specify your dataset instead.' + "The `catalog` argument has been deprecated and intake is no longer supported. " + "Please use the `data_source` argument to specify your dataset instead." ) - + if data_source is None: raise ValueError("data_source is a required arguemnt") - + # Raise warnings for deprecated arguments if filename_pattern: warnings.warn( - 'The `filename_pattern` argument is deprecated. Instead please provide a ' - 'string, list, or glob string to the `data_source` argument.', + "The `filename_pattern` argument is deprecated. Instead please provide a " + "string, list, or glob string to the `data_source` argument.", stacklevel=2, ) - + if product: product = is2ref._validate_product(product) warnings.warn( - 'The `product` argument is no longer required. If the `data_source` argument given ' - 'contains files with multiple products the `product` argument will be used ' - 'to filter that list. In all other cases the product argument is ignored. ' - 'The recommended approach is to not include a `product` argument and instead ' - 'provide a `data_source` with files of only a single product type`.', + "The `product` argument is no longer required. If the `data_source` argument given " + "contains files with multiple products the `product` argument will be used " + "to filter that list. In all other cases the product argument is ignored. 
" + "The recommended approach is to not include a `product` argument and instead " + "provide a `data_source` with files of only a single product type`.", stacklevel=2, ) @@ -369,7 +369,7 @@ def __init__( elif isinstance(data_source, list): self._filelist = data_source elif os.path.isdir(data_source): - data_source = os.path.join(data_source, '*') + data_source = os.path.join(data_source, "*") self._filelist = glob.glob(data_source, **glob_kwargs) else: self._filelist = glob.glob(data_source, **glob_kwargs) @@ -380,14 +380,14 @@ def __init__( product_dict = {} for file_ in self._filelist: product_dict[file_] = self._extract_product(file_) - + # Raise warnings or errors for muliple products or products not matching the user-specified product all_products = list(set(product_dict.values())) if len(all_products) > 1: if product: warnings.warn( - f'Multiple products found in list of files: {product_dict}. Files that ' - 'do not match the user specified product will be removed from processing.', + f"Multiple products found in list of files: {product_dict}. Files that " + "do not match the user specified product will be removed from processing.", stacklevel=2, ) self._filelist = [] @@ -396,21 +396,21 @@ def __init__( self._filelist.append(key) if len(self._filelist) == 0: raise TypeError( - 'No files found in the file list matching the user-specified ' - 'product type' + "No files found in the file list matching the user-specified " + "product type" ) # Use the cleaned filelist to assign a product self._product = product else: raise TypeError( - f'Multiple product types were found in the file list: {product_dict}.' - 'Please provide a valid `data_source` parameter indicating files of a single ' - 'product' + f"Multiple product types were found in the file list: {product_dict}." + "Please provide a valid `data_source` parameter indicating files of a single " + "product" ) elif len(all_products) == 0: raise TypeError( - 'No files found matching the specified `data_source`. 
Check your glob ' - 'string or file list.' + "No files found matching the specified `data_source`. Check your glob " + "string or file list." ) else: # Assign the identified product to the property @@ -418,11 +418,11 @@ def __init__( # Raise a warning if the metadata-located product differs from the user-specified product if product and self._product != product: warnings.warn( - f'User specified product {product} does not match the product from the file' - ' metadata {self._product}', + f"User specified product {product} does not match the product from the file" + " metadata {self._product}", stacklevel=2, ) - + if out_obj_type is not None: print( "Output object type will be an xarray DataSet - " @@ -458,7 +458,7 @@ def vars(self): ) return self._read_vars - + @property def filelist(self): """ @@ -475,21 +475,21 @@ def product(self): # ---------------------------------------------------------------------- # Methods - + @staticmethod def _extract_product(filepath): """ Read the product type from the metadata of the file. Return the product as a string. 
""" - with h5py.File(filepath, 'r') as f: - try: - product = f.attrs['short_name'].decode() + with h5py.File(filepath, "r") as f: + try: + product = f.attrs["short_name"].decode() product = is2ref._validate_product(product) # TODO test that this is the proper error except KeyError: - raise 'Unable to parse the product name from file metadata' + raise "Unable to parse the product name from file metadata" return product - + @staticmethod def _check_source_for_pattern(source, filename_pattern): """ From 6b953f9c63151c20a5224dc9e38db5b73dae02f8 Mon Sep 17 00:00:00 2001 From: Rachel Wegener <35503632+rwegener2@users.noreply.github.com> Date: Tue, 10 Oct 2023 09:13:51 -0400 Subject: [PATCH 26/30] Apply suggestions from code review Co-authored-by: Jessica Scheick --- icepyx/core/read.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index e687511d1..c63c6d954 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -268,6 +268,7 @@ class Read: ---------- data_source : string, List A string or list which specifies the files to be read. The string can be either: 1) the path of a single file 2) the path to a directory or 3) a [glob string](https://docs.python.org/3/library/glob.html). + The List must be a list of strings, each of which is the path of a single file. product : string ICESat-2 data product ID, also known as "short name" (e.g. ATL03). 
@@ -322,7 +323,7 @@ class Read: def __init__( self, - data_source=None, # DevNote: Make this a required arg when catalog is removed + data_source=None, product=None, filename_pattern=None, catalog=None, @@ -381,7 +382,7 @@ def __init__( for file_ in self._filelist: product_dict[file_] = self._extract_product(file_) - # Raise warnings or errors for muliple products or products not matching the user-specified product + # Raise warnings or errors for multiple products or products not matching the user-specified product all_products = list(set(product_dict.values())) if len(all_products) > 1: if product: From 45704a4e94368b7fe64466908aaff45fdc78f5db Mon Sep 17 00:00:00 2001 From: Rachel Wegener <35503632+rwegener2@users.noreply.github.com> Date: Tue, 10 Oct 2023 11:33:16 -0400 Subject: [PATCH 27/30] elaborate on multiple products warning --- icepyx/core/read.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index c63c6d954..eb4d1168d 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -388,7 +388,9 @@ def __init__( if product: warnings.warn( f"Multiple products found in list of files: {product_dict}. Files that " - "do not match the user specified product will be removed from processing.", + "do not match the user specified product will be removed from processing.\n" + "Filtering files using a `product` argument is deprecated. 
Please use the " + "`data_source` argument to specify a list of files with the same product.", stacklevel=2, ) self._filelist = [] From 2bf28086f00bab031390bf85cc81baa5257e8bce Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 10 Oct 2023 15:46:56 +0000 Subject: [PATCH 28/30] clarify glob section --- doc/source/example_notebooks/IS2_data_read-in.ipynb | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/doc/source/example_notebooks/IS2_data_read-in.ipynb b/doc/source/example_notebooks/IS2_data_read-in.ipynb index 4cdd3bf5a..9bbac368b 100644 --- a/doc/source/example_notebooks/IS2_data_read-in.ipynb +++ b/doc/source/example_notebooks/IS2_data_read-in.ipynb @@ -248,11 +248,13 @@ "user_expressions": [] }, "source": [ - "glob will not by default search all of the subdirectories for matching filepaths, but it has the ability to do so. To search recursively you need to 1) use `/**/` in the filepath to match any level of nested folders and 2) use the `recursive=True` argument. \n", + "glob will not by default search all of the subdirectories for matching filepaths, but it has the ability to do so.\n", "\n", "If you would like to search recursively, you can achieve this by either:\n", - "1. passing the `recursive` argument into `glob_kwargs`\n", - "2. using glob directly to create a list of filepaths" + "1. passing the `recursive` argument into `glob_kwargs` and including `\\**\\` in your filepath\n", + "2. using glob directly to create a list of filepaths\n", + "\n", + "Each of these two methods is shown below."
] }, { From 12428817b9445daba3933e5a75d885d622aef1ad Mon Sep 17 00:00:00 2001 From: Rachel Wegener Date: Tue, 10 Oct 2023 16:05:26 +0000 Subject: [PATCH 29/30] test product name error --- icepyx/core/read.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/icepyx/core/read.py b/icepyx/core/read.py index eb4d1168d..a85ee659b 100644 --- a/icepyx/core/read.py +++ b/icepyx/core/read.py @@ -488,9 +488,10 @@ def _extract_product(filepath): try: product = f.attrs["short_name"].decode() product = is2ref._validate_product(product) - # TODO test that this is the proper error except KeyError: - raise "Unable to parse the product name from file metadata" + raise AttributeError( + f"Unable to extract the product name from file metadata." + ) return product @staticmethod From e18cf7a67adf9944de9a054d6ee0fcb91211c881 Mon Sep 17 00:00:00 2001 From: GitHub Action Date: Wed, 18 Oct 2023 17:49:35 +0000 Subject: [PATCH 30/30] GitHub action UML generation auto-update --- .../documentation/classes_dev_uml.svg | 122 +++++++++--------- .../documentation/classes_user_uml.svg | 21 +-- 2 files changed, 72 insertions(+), 71 deletions(-) diff --git a/doc/source/user_guide/documentation/classes_dev_uml.svg b/doc/source/user_guide/documentation/classes_dev_uml.svg index 34e13b41c..0cd08c9e9 100644 --- a/doc/source/user_guide/documentation/classes_dev_uml.svg +++ b/doc/source/user_guide/documentation/classes_dev_uml.svg @@ -4,11 +4,11 @@ - + classes_dev_uml - + icepyx.core.auth.AuthenticationError @@ -139,38 +139,38 @@ icepyx.core.icesat2data.Icesat2Data - -Icesat2Data - - -__init__() + +Icesat2Data + + +__init__() icepyx.core.exceptions.NsidcQueryError - -NsidcQueryError - -errmsg -msgtxt : str - -__init__(errmsg, msgtxt) -__str__() + +NsidcQueryError + +errmsg +msgtxt : str + +__init__(errmsg, msgtxt) +__str__() icepyx.core.exceptions.QueryError - -QueryError - - - + +QueryError + + + icepyx.core.exceptions.NsidcQueryError->icepyx.core.exceptions.QueryError - - + + @@ 
-235,24 +235,24 @@ icepyx.core.read.Read - -Read - -_filelist : NoneType, list -_out_obj : Dataset -_pattern : str -_prod : str -_read_vars -_source_type : str -data_source -vars - -__init__(data_source, product, filename_pattern, catalog, out_obj_type) -_add_vars_to_ds(is2ds, ds, grp_path, wanted_groups_tiered, wanted_dict) -_build_dataset_template(file) -_build_single_file_dataset(file, groups_list) -_check_source_for_pattern(source, filename_pattern) -_combine_nested_vars(is2ds, ds, grp_path, wanted_dict) + +Read + +_filelist : NoneType, list +_out_obj : Dataset +_product : NoneType, str +_read_vars +filelist +product +vars + +__init__(data_source, product, filename_pattern, catalog, glob_kwargs, out_obj_type) +_add_vars_to_ds(is2ds, ds, grp_path, wanted_groups_tiered, wanted_dict) +_build_dataset_template(file) +_build_single_file_dataset(file, groups_list) +_check_source_for_pattern(source, filename_pattern) +_combine_nested_vars(is2ds, ds, grp_path, wanted_dict) +_extract_product(filepath) _read_single_grp(file, grp_path) load() @@ -366,30 +366,30 @@ icepyx.core.variables.Variables->icepyx.core.read.Read - - -_read_vars + + +_read_vars icepyx.core.visualization.Visualize - -Visualize - -bbox : list -cycles : NoneType -date_range : NoneType -product : NoneType, str -tracks : NoneType - -__init__(query_obj, product, spatial_extent, date_range, cycles, tracks) -generate_OA_parameters(): list -grid_bbox(binsize): list -make_request(base_url, payload) -parallel_request_OA(): da.array -query_icesat2_filelist(): tuple -request_OA_data(paras): da.array -viz_elevation(): (hv.DynamicMap, hv.Layout) + +Visualize + +bbox : list +cycles : NoneType +date_range : NoneType +product : NoneType, str +tracks : NoneType + +__init__(query_obj, product, spatial_extent, date_range, cycles, tracks) +generate_OA_parameters(): list +grid_bbox(binsize): list +make_request(base_url, payload) +parallel_request_OA(): da.array +query_icesat2_filelist(): tuple +request_OA_data(paras): 
da.array +viz_elevation(): (hv.DynamicMap, hv.Layout) diff --git a/doc/source/user_guide/documentation/classes_user_uml.svg b/doc/source/user_guide/documentation/classes_user_uml.svg index 640f76815..a9c116469 100644 --- a/doc/source/user_guide/documentation/classes_user_uml.svg +++ b/doc/source/user_guide/documentation/classes_user_uml.svg @@ -201,13 +201,14 @@ icepyx.core.read.Read - -Read - -data_source -vars - -load() + +Read + +filelist +product +vars + +load() @@ -300,9 +301,9 @@ icepyx.core.variables.Variables->icepyx.core.read.Read - - -_read_vars + + +_read_vars