diff --git a/README.md b/README.md index 464dfbc1..869a21c1 100644 --- a/README.md +++ b/README.md @@ -1,5 +1,5 @@ # maap-documentation -[![Documentation Status](https://readthedocs.org/projects/maap-project/badge/?version=latest)](https://maap-project.readthedocs.io/en/latest/?badge=latest) +[![Documentation Status](https://readthedocs.org/projects/maap-project/badge/?version=latest)](https://maap-project.readthedocs.io/en/latest/?badge=latest) [![DOI](https://zenodo.org/badge/235617200.svg)](https://zenodo.org/doi/10.5281/zenodo.10499174) This repository serves as the technical documentation for interfacing with the MAAP services. diff --git a/docs/source/_static/faq_images/import_granules.png b/docs/source/_static/faq_images/import_granules.png new file mode 100644 index 00000000..3603350a Binary files /dev/null and b/docs/source/_static/faq_images/import_granules.png differ diff --git a/docs/source/_static/faq_images/import_granules_1.png b/docs/source/_static/faq_images/import_granules_1.png deleted file mode 100644 index 3e6361db..00000000 Binary files a/docs/source/_static/faq_images/import_granules_1.png and /dev/null differ diff --git a/docs/source/_static/jobs_ui_access.png b/docs/source/_static/jobs_ui/jobs_ui_access.png similarity index 100% rename from docs/source/_static/jobs_ui_access.png rename to docs/source/_static/jobs_ui/jobs_ui_access.png diff --git a/docs/source/_static/jobs_ui_copy_code.png b/docs/source/_static/jobs_ui/jobs_ui_copy_code.png similarity index 100% rename from docs/source/_static/jobs_ui_copy_code.png rename to docs/source/_static/jobs_ui/jobs_ui_copy_code.png diff --git a/docs/source/_static/jobs_ui_failed_toast.png b/docs/source/_static/jobs_ui/jobs_ui_failed_toast.png similarity index 100% rename from docs/source/_static/jobs_ui_failed_toast.png rename to docs/source/_static/jobs_ui/jobs_ui_failed_toast.png diff --git a/docs/source/_static/jobs_ui_overview.png b/docs/source/_static/jobs_ui/jobs_ui_overview.png similarity 
index 100% rename from docs/source/_static/jobs_ui_overview.png rename to docs/source/_static/jobs_ui/jobs_ui_overview.png diff --git a/docs/source/_static/jobs_ui_submit.png b/docs/source/_static/jobs_ui/jobs_ui_submit.png similarity index 100% rename from docs/source/_static/jobs_ui_submit.png rename to docs/source/_static/jobs_ui/jobs_ui_submit.png diff --git a/docs/source/_static/jobs_ui_submit_detail.png b/docs/source/_static/jobs_ui/jobs_ui_submit_detail.png similarity index 100% rename from docs/source/_static/jobs_ui_submit_detail.png rename to docs/source/_static/jobs_ui/jobs_ui_submit_detail.png diff --git a/docs/source/_static/jobs_ui_submit_toast.png b/docs/source/_static/jobs_ui/jobs_ui_submit_toast.png similarity index 100% rename from docs/source/_static/jobs_ui_submit_toast.png rename to docs/source/_static/jobs_ui/jobs_ui_submit_toast.png diff --git a/docs/source/_static/jobs_ui/revoke_failed.png b/docs/source/_static/jobs_ui/revoke_failed.png new file mode 100644 index 00000000..635fddf2 Binary files /dev/null and b/docs/source/_static/jobs_ui/revoke_failed.png differ diff --git a/docs/source/_static/jobs_ui/revoke_job.png b/docs/source/_static/jobs_ui/revoke_job.png new file mode 100644 index 00000000..3cb485e8 Binary files /dev/null and b/docs/source/_static/jobs_ui/revoke_job.png differ diff --git a/docs/source/_static/jobs_ui/revoke_successful.png b/docs/source/_static/jobs_ui/revoke_successful.png new file mode 100644 index 00000000..6dfc96a6 Binary files /dev/null and b/docs/source/_static/jobs_ui/revoke_successful.png differ diff --git a/docs/source/getting_started/_static/storage_options_diagram.png b/docs/source/getting_started/_static/storage_options_diagram.png index bc647e24..179ab90a 100644 Binary files a/docs/source/getting_started/_static/storage_options_diagram.png and b/docs/source/getting_started/_static/storage_options_diagram.png differ diff --git a/docs/source/getting_started/getting_started.ipynb 
b/docs/source/getting_started/getting_started.ipynb index 36295342..03951a3e 100644 --- a/docs/source/getting_started/getting_started.ipynb +++ b/docs/source/getting_started/getting_started.ipynb @@ -136,8 +136,8 @@ "\n", "#### My root folder (fast cloud storage)\n", " - Your Jupyter home directory (`~`) is mounted to `/projects`. Files in here persist across sessions and exist across your workspaces.\n", - " - Use this for code-related items, smaller data storage\n", - " - Git is more likely to behave predictably here compared to other storage\n", + " - Use this for code-related items, smaller data storage (such as Jupyter Notebooks, Python/ R/ Markdown files, etc.)\n", + " - Git is more likely to behave predictably here compared to other storage \n", " - This is also the place to make persistent conda environments (covered in another section), but make sure to not make a conda env inside a git-tracked folder, or if you do add it to the .gitignore. If git is tracking an env, it could cause your workspace to crash. \n", " - Uses local (to Jupyter) file system; generally faster and more reliable for “normal” file operations, but expensive\n", "\n", @@ -145,12 +145,13 @@ "`~/my-private-bucket` is an S3 bucket with persistent storage, but accessible only to you and others in a shared workspace.\n", " \n", " - Use for large data storage\n", - " - It will be slower than the root folder to copy and move files, which is why it is not ideal for storing smaller files that need to be read or written quickly\n", + " - It will be slower than the root folder to copy and move files, which is why it is not ideal for storing smaller files that need to be read or written quickly (e.g. Jupyter Notebooks)\n", "\n", "#### Sharing files: my-public-bucket and shared-buckets\n", "`~/my-public-bucket` is an S3 bucket with persistent storage. It is the same as `~/shared-buckets//` — anything you put in here will be accessible to other users via `~/shared-buckets/` as a read-only file. 
Likewise, to find shared files from another user, look in `~/shared-buckets/`.\n", "\n", - " - Use for large data storage for files that you want to share across workspaces\n", + " - Use for large data storage for files that you want to share across workspaces \n", + " - Public and shared buckets are not recommended for Jupyter Notebooks\n", "\n", "![Storage options diagram](_static/storage_options_diagram.png)\n", "\n", @@ -161,9 +162,9 @@ ], "metadata": { "kernelspec": { - "display_name": "Python [conda env:root] *", + "display_name": "Python 3.12.0 64-bit", "language": "python", - "name": "conda-root-py" + "name": "python3" }, "language_info": { "codemirror_mode": { @@ -175,12 +176,17 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.7.8" + "version": "3.12.0" }, "metadata": { "interpreter": { "hash": "31f2aee4e71d21fbe5cf8b01ff0e069b9275f58929596ceb00d14d90e3e16cd6" } + }, + "vscode": { + "interpreter": { + "hash": "7500c3e1c7c786e4ba1e4b4eb7588219b4e35d5153674f92eb3a82672b534f6e" + } } }, "nbformat": 4, diff --git a/docs/source/getting_started/running_at_scale.ipynb b/docs/source/getting_started/running_at_scale.ipynb index 858d0876..c2295829 100644 --- a/docs/source/getting_started/running_at_scale.ipynb +++ b/docs/source/getting_started/running_at_scale.ipynb @@ -80,7 +80,7 @@ "\n", "The Jobs UI will let you run and monitor jobs easily. 
You can find full documentation in the system reference guide for [the Jobs UI](../system_reference_guide/jobsui.ipynb) or [using maap-py](../system_reference_guide/jobs_maappy.ipynb) with Python in the System Reference Guide FAQs.\n", "\n", - "![job_ui_access](../_static/jobs_ui_access.png)\n", + "![job_ui_access](../_static/jobs_ui/jobs_ui_access.png)\n", "\n", "Some alternative methods of running the job are found below.\n", "\n", diff --git a/docs/source/science/ATL08/ATL08.ipynb b/docs/source/science/ATL08/ATL08.ipynb new file mode 100644 index 00000000..87267e91 --- /dev/null +++ b/docs/source/science/ATL08/ATL08.ipynb @@ -0,0 +1,1394 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "71971df7", + "metadata": {}, + "source": [ + "# ATLAS/ICESat-2 ATL08 Access and Visualize\n", + "\n", + "Authors: Sumant Jha (MSFC/USRA), Alex Mandel (DevSeed), Jamison French (DevSeed), Rajat Shinde (UAH), Sheyenne Kirkland (UAH)\n", + "\n", + "Date: March 7, 2024\n", + "\n", + "Description: In this example, we'll walk through accessing ATL08 data using both direct cloud access and local download. We'll then explore the data using `h5py`, `h5glance`, and `xarray`. Finally, we'll visualize some of the data using `xarray`." + ] + }, + { + "cell_type": "markdown", + "id": "1d840225-f6db-4077-bfa3-94b6921e7265", + "metadata": {}, + "source": [ + "## Run This Notebook\n", + "\n", + "To access and run this tutorial within MAAP's Algorithm Development Environment (ADE), please refer to the [\"Getting started with the MAAP\"](https://docs.maap-project.org/en/latest/getting_started/getting_started.html) section of our documentation.\n", + "\n", + "Disclaimer: This tutorial will use an experimental feature to allow access to the DAAC without using Earthdata Login. This tutorial will need to be run within MAAP's ADE to allow this experimental feature to work. Running the tutorial outside of the MAAP ADE will result in errors. 
Additionally, it is recommended to use the `Pangeo` workspace within the MAAP ADE." + ] + }, + { + "cell_type": "markdown", + "id": "ff8efa52-24ef-42ce-b616-4d259039569e", + "metadata": {}, + "source": [ + "## About the Data\n", + "\n", + "This data set (ATL08) contains along-track heights above the WGS84 ellipsoid (ITRF2014 reference frame) for the ground and canopy surfaces. The canopy and ground surfaces are processed in fixed 100 m data segments, which typically contain more than 100 signal photons. The data were acquired by the Advanced Topographic Laser Altimeter System (ATLAS) instrument on board the Ice, Cloud and land Elevation Satellite-2 (ICESat-2) observatory.\n", + "\n", + "```\n", + "Parameter(s): TERRAIN ELEVATION\n", + "Platform(s): ICESat-2\n", + "Sensor(s): ATLAS\n", + "Data Format(s): HDF5\n", + "Temporal Coverage: 14 October 2018 to present\n", + "Temporal Resolution: 91 day\n", + "Spatial Resolution: Varies\n", + "Spatial Reference System(s): WGS 84 EPSG:4326\n", + "Spatial Coverage: N: 90 S: -90 E: 180 W: -180\n", + "```\n", + "\n", + "(Source: [ATL08 v6 Dataset Landing Page](https://nsidc.org/data/atl08/versions/6))\n" + ] + }, + { + "cell_type": "markdown", + "id": "24b1f8cd-53f1-43f6-b85d-1224576e8605", + "metadata": {}, + "source": [ + "## Additional Resources\n", + "- [Earthdata Search](https://search.earthdata.nasa.gov/search?q=atl08&ff=Available%20in%20Earthdata%20Cloud)\n", + "- [ATL08 v6 User Guide](https://nsidc.org/sites/default/files/documents/user-guide/atl08-v006-userguide.pdf)" + ] + }, + { + "cell_type": "markdown", + "id": "d0c3d7fb-6d7f-4027-9c73-15379dfa9d62", + "metadata": {}, + "source": [ + "## Importing and Installing Packages" + ] + }, + { + "cell_type": "markdown", + "id": "bceb37a2", + "metadata": {}, + "source": [ + "The following example uses several packages. 
If you do not have them installed, uncomment and run the code below:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "3a9b3e53-c67b-4294-999a-04e7cc2c149c", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "# !pip install -q h5py h5glance requests fsspec s3fs h5netcdf" + ] + }, + { + "cell_type": "markdown", + "id": "69ee9aed-39a7-42fa-aa85-e5185a7ffc7f", + "metadata": {}, + "source": [ + "Optional install (not needed if you're using the Pangeo workspace; uncomment if you're using another workspace):" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c9665604-ce0e-47b1-b7b9-5648d62a6b2e", + "metadata": {}, + "outputs": [], + "source": [ + "# !pip install -q rioxarray" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "43dc9655", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "import h5py\n", + "from maap.maap import MAAP\n", + "from h5glance import H5Glance\n", + "import requests\n", + "import xarray\n", + "import boto3\n", + "import fsspec" + ] + }, + { + "cell_type": "markdown", + "id": "9a01c263-4b64-4eb5-8844-672456f3fec0", + "metadata": {}, + "source": [ + "## Accessing the Data" + ] + }, + { + "cell_type": "markdown", + "id": "ab76b7e7-408e-45c3-b506-d193cb505aab", + "metadata": {}, + "source": [ + "In this section we'll walk through two different ways to access the data. The first method is to access the data through S3.\n", + "\n", + "The second method is to access it by using `maap-py`, then download the data locally. From there, we will explore some of the data using `h5glance`." + ] + }, + { + "cell_type": "markdown", + "id": "ff2227d4", + "metadata": {}, + "source": [ + "### Example 1: Accessing the Data with S3\n", + "\n", + "We will use role assumption to gain access to the data. To do this, we'll use an experimental feature that involves setting up a parameter, assuming a role, and getting temporary credentials with the assumed role. 
We'll also pass the credentials to `fsspec` so we can later use `xarray` for data exploration." + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "23c1abf0-0369-4833-85ef-3e556409959a", + "metadata": {}, + "outputs": [], + "source": [ + "def assume_role_credentials(ssm_parameter_name):\n", + " # Create a session using your current credentials\n", + " session = boto3.Session()\n", + "\n", + " # Retrieve the SSM parameter\n", + " ssm = session.client('ssm', \"us-west-2\")\n", + " parameter = ssm.get_parameter(\n", + " Name=ssm_parameter_name, \n", + " WithDecryption=True\n", + " )\n", + " parameter_value = parameter['Parameter']['Value']\n", + "\n", + " # Assume the DAAC access role\n", + " sts = session.client('sts')\n", + " assumed_role_object = sts.assume_role(\n", + " RoleArn=parameter_value,\n", + " RoleSessionName='TutorialSession'\n", + " )\n", + "\n", + " # From the response that contains the assumed role, get the temporary \n", + " # credentials that can be used to make subsequent API calls\n", + " credentials = assumed_role_object['Credentials']\n", + "\n", + " return credentials\n", + "\n", + "def fsspec_access(credentials):\n", + " # Pass assumed role credentials into fsspec\n", + " return fsspec.filesystem(\n", + " \"s3\",\n", + " key=credentials['AccessKeyId'],\n", + " secret=credentials['SecretAccessKey'],\n", + " token=credentials['SessionToken']\n", + " )" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "9d93b99d-37a3-4f9e-a4e8-4939a8275506", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "s3_fsspec = fsspec_access(assume_role_credentials(\"/iam/maap-data-reader\"))" + ] + }, + { + "cell_type": "markdown", + "id": "6d45ac1b", + "metadata": {}, + "source": [ + "### Example 2: Download Data Locally" + ] + }, + { + "cell_type": "markdown", + "id": "3ffb06f4", + "metadata": {}, + "source": [ + "We are going to use the NASA host, which is NASA's Common Metadata Repository (CMR), to search for and 
download ICESat-2 data. \n", + "The concept ID for ICESat-2's ATL08 data can be found by going to https://search.earthdata.nasa.gov/search and searching for 'ATL08' in the search bar. When you check the metadata associated with your search result, you can find the concept_id used in this tutorial. In this case, the concept_id is `C2613553260-NSIDC_CPRD`. \n", + "\n", + "For this example, we are going to use the granule ID `ATL08_20230816182927_08792008_006_01.h5`. This will be in HDF5 format. \n", + "\n", + "With all this information in hand, we are ready to make a query to cmr.earthdata.nasa.gov using `maap-py`. \n" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "e87a6048", + "metadata": {}, + "outputs": [], + "source": [ + "maap = MAAP(maap_host='api.maap-project.org')\n", + "\n", + "nasa_host = \"cmr.earthdata.nasa.gov\"\n", + "results = maap.searchGranule(cmr_host=nasa_host,\n", + " concept_id=\"C2613553260-NSIDC_CPRD\",\n", + " readable_granule_name=\"ATL08_20230816182927_08792008_006_01.h5\")" + ] + }, + { + "cell_type": "markdown", + "id": "1b5b0235", + "metadata": {}, + "source": [ + "Let's see how this turned out. Did we get a result?" 
+ ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "1fff1d07", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'concept-id': 'G2800397933-NSIDC_CPRD',\n", + " 'collection-concept-id': 'C2613553260-NSIDC_CPRD',\n", + " 'revision-id': '2',\n", + " 'format': 'application/echo10+xml',\n", + " 'Granule': {'GranuleUR': 'ATL08_20230816182927_08792008_006_01.h5',\n", + " 'InsertTime': '2023-11-11T10:14:36.642Z',\n", + " 'LastUpdate': '2023-11-11T10:14:36.642Z',\n", + " 'Collection': {'DataSetId': 'ATLAS/ICESat-2 L3A Land and Vegetation Height V006'},\n", + " 'DataGranule': {'SizeMBDataGranule': '106.29328060150146',\n", + " 'ProducerGranuleId': 'ATL08_20230816182927_08792008_006_01.h5',\n", + " 'DayNightFlag': 'UNSPECIFIED',\n", + " 'ProductionDateTime': '2023-09-21T19:57:30.000Z'},\n", + " 'Temporal': {'RangeDateTime': {'BeginningDateTime': '2023-08-16T18:29:24.813Z',\n", + " 'EndingDateTime': '2023-08-16T18:36:27.524Z'}},\n", + " 'Spatial': {'HorizontalSpatialDomain': {'Geometry': {'GPolygon': {'Boundary': {'Point': [{'PointLongitude': '-49.71155',\n", + " 'PointLatitude': '-0.55384'},\n", + " {'PointLongitude': '-51.21715', 'PointLatitude': '-15.49643'},\n", + " {'PointLongitude': '-52.36359', 'PointLatitude': '-26.40442'},\n", + " {'PointLongitude': '-52.43242', 'PointLatitude': '-27.04278'},\n", + " {'PointLongitude': '-52.5585', 'PointLatitude': '-27.03176'},\n", + " {'PointLongitude': '-52.48902', 'PointLatitude': '-26.39347'},\n", + " {'PointLongitude': '-51.3338', 'PointLatitude': '-15.48562'},\n", + " {'PointLongitude': '-49.82395', 'PointLatitude': '-0.54264'},\n", + " {'PointLongitude': '-49.76474', 'PointLatitude': '0.04913'},\n", + " {'PointLongitude': '-49.65236', 'PointLatitude': '0.03773'}]}}}}},\n", + " 'OnlineAccessURLs': {'OnlineAccessURL': [{'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-protected/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01.h5',\n", + " 'MimeType': 
'application/x-hdf5'},\n", + " {'URL': 's3://nsidc-cumulus-prod-protected/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01.h5',\n", + " 'MimeType': 'application/x-hdf5'}]},\n", + " 'OnlineResources': {'OnlineResource': [{'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-protected/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01.h5.dmrpp',\n", + " 'Type': 'USER SUPPORT',\n", + " 'MimeType': 'application/vnd.opendap.dap4.dmrpp+xml'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01.iso.xml',\n", + " 'Type': 'USER SUPPORT',\n", + " 'MimeType': 'text/xml'},\n", + " {'URL': 's3://nsidc-cumulus-prod-protected/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01.h5.dmrpp',\n", + " 'Type': 'USER SUPPORT',\n", + " 'MimeType': 'application/vnd.opendap.dap4.dmrpp+xml'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01.iso.xml',\n", + " 'Type': 'USER SUPPORT',\n", + " 'MimeType': 'text/xml'},\n", + " {'URL': 'https://opendap.earthdata.nasa.gov/collections/C2613553260-NSIDC_CPRD/granules/ATL08_20230816182927_08792008_006_01.h5',\n", + " 'Type': 'USER SUPPORT'}]},\n", + " 'AssociatedBrowseImageUrls': {'ProviderBrowseUrl': [{'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.default.default1.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.default.default2.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1l.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 
'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1l.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1l.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1l.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1l.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1r.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1r.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1r.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1r.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1r.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 
'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2l.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2l.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2l.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2l.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2l.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2r.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2r.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2r.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2r.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 
'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2r.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3l.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3l.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3l.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3l.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3l.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3r.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3r.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3r.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 
'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3r.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 'https://data.nsidc.earthdatacloud.nasa.gov/nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3r.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.default.default1.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.default.default2.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1l.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1l.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1l.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1l.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1l.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1r.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1r.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 
's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1r.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1r.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt1r.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2l.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2l.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2l.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2l.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2l.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2r.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2r.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2r.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 
's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2r.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt2r.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3l.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3l.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3l.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3l.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3l.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3r.groundtrack.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3r.h_canopy_abs.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3r.h_te_median.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3r.n_ca_photons.jpg',\n", + " 'MimeType': 'image/jpeg'},\n", + " {'URL': 
's3://nsidc-cumulus-prod-public/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01_BRW.gt3r.n_te_photons.jpg',\n", + " 'MimeType': 'image/jpeg'}]}}}" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "data_file = results[0]\n", + "data_file" + ] + }, + { + "cell_type": "markdown", + "id": "163283a5", + "metadata": {}, + "source": [ + "Looks like we did get a result and will be able to learn a lot about it from available metadata. Let's download the HDF file locally.\n", + "\n", + "Establish a temporary directory to store the data file and display the path and filename:" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "419c6e78", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'./data/ATL08_20230816182927_08792008_006_01.h5'" + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dataDir = './data'\n", + "if not os.path.exists(dataDir): os.mkdir(dataDir)\n", + "data = data_file.getData(dataDir)\n", + "data" + ] + }, + { + "cell_type": "markdown", + "id": "188a7017-ed15-44f4-8d25-9bfe5ca43524", + "metadata": {}, + "source": [ + "## Exploring the Data\n", + "\n", + "There are two different ways we'll open and look at the data:\n", + "1. Using `xarray`\n", + "2. Using `h5py`" + ] + }, + { + "cell_type": "markdown", + "id": "f424754e-5b2e-4b82-ba94-dead8e39b887", + "metadata": {}, + "source": [ + "### 1. xarray" + ] + }, + { + "cell_type": "markdown", + "id": "fd45311f-64ce-4afc-a664-396e33bdf56f", + "metadata": {}, + "source": [ + "First, let's grab the S3 URL for direct access from our results above." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 17, + "id": "162ed41f", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'s3://nsidc-cumulus-prod-protected/ATLAS/ATL08/006/2023/08/16/ATL08_20230816182927_08792008_006_01.h5'" + ] + }, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "s3_url = results[0]['Granule']['OnlineAccessURLs']['OnlineAccessURL'][1]['URL']\n", + "s3_url" + ] + }, + { + "cell_type": "markdown", + "id": "6e2308ef-97c6-40a1-9cc8-2ddf77f5538d", + "metadata": {}, + "source": [ + "Now we can open a specific group within the HDF5 file using `xarray`." + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "id": "6d30ef03-4878-4e9b-beef-b535476db455", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
<xarray.Dataset>\n",
+       "Dimensions:            (delta_time: 18690, ds_geosegments: 5, ds_surf_type: 5)\n",
+       "Coordinates:\n",
+       "  * delta_time         (delta_time) datetime64[ns] 2023-08-16T18:29:24.853128...\n",
+       "    latitude           (delta_time) float32 ...\n",
+       "    longitude          (delta_time) float32 ...\n",
+       "Dimensions without coordinates: ds_geosegments, ds_surf_type\n",
+       "Data variables: (12/41)\n",
+       "    asr                (delta_time) float32 ...\n",
+       "    atlas_pa           (delta_time) float32 ...\n",
+       "    beam_azimuth       (delta_time) float32 ...\n",
+       "    beam_coelev        (delta_time) float32 ...\n",
+       "    brightness_flag    (delta_time) float32 ...\n",
+       "    cloud_flag_atm     (delta_time) float32 ...\n",
+       "    ...                 ...\n",
+       "    snr                (delta_time) float32 ...\n",
+       "    solar_azimuth      (delta_time) float32 ...\n",
+       "    solar_elevation    (delta_time) float32 ...\n",
+       "    surf_type          (delta_time, ds_surf_type) int8 ...\n",
+       "    terrain_flg        (delta_time) float64 ...\n",
+       "    urban_flag         (delta_time) float64 ...\n",
+       "Attributes:\n",
+       "    Description:  Contains data categorized as land at 100 meter intervals.\n",
+       "    data_rate:    Data are stored as aggregates of 100 meters.
" + ], + "text/plain": [ + "\n", + "Dimensions: (delta_time: 18690, ds_geosegments: 5, ds_surf_type: 5)\n", + "Coordinates:\n", + " * delta_time (delta_time) datetime64[ns] 2023-08-16T18:29:24.853128...\n", + " latitude (delta_time) float32 ...\n", + " longitude (delta_time) float32 ...\n", + "Dimensions without coordinates: ds_geosegments, ds_surf_type\n", + "Data variables: (12/41)\n", + " asr (delta_time) float32 ...\n", + " atlas_pa (delta_time) float32 ...\n", + " beam_azimuth (delta_time) float32 ...\n", + " beam_coelev (delta_time) float32 ...\n", + " brightness_flag (delta_time) float32 ...\n", + " cloud_flag_atm (delta_time) float32 ...\n", + " ... ...\n", + " snr (delta_time) float32 ...\n", + " solar_azimuth (delta_time) float32 ...\n", + " solar_elevation (delta_time) float32 ...\n", + " surf_type (delta_time, ds_surf_type) int8 ...\n", + " terrain_flg (delta_time) float64 ...\n", + " urban_flag (delta_time) float64 ...\n", + "Attributes:\n", + " Description: Contains data categorized as land at 100 meter intervals.\n", + " data_rate: Data are stored as aggregates of 100 meters." + ] + }, + "execution_count": 18, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "with s3_fsspec.open(s3_url) as f:\n", + " atl08_track = xarray.open_dataset(f, group='gt1l/land_segments', engine=\"h5netcdf\", phony_dims='sort')\n", + "atl08_track" + ] + }, + { + "cell_type": "markdown", + "id": "11316bbe-637e-46a1-ab06-4f5ac18b0b70", + "metadata": {}, + "source": [ + "### 2. H5py and H5glance\n", + "\n", + "Let's check the available keys and structure of the HDF5 files using `H5py` and `H5glance`. 
This will use the downloaded file that we saved locally.\n", + "\n", + "Open the file and list the keys:" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "id": "2bebf474-efdd-44c0-8d1f-74795218712e", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "data": { + "text/plain": [ + "['METADATA',\n", + " 'ancillary_data',\n", + " 'ds_geosegments',\n", + " 'ds_metrics',\n", + " 'ds_surf_type',\n", + " 'gt1l',\n", + " 'gt1r',\n", + " 'gt2l',\n", + " 'gt2r',\n", + " 'gt3l',\n", + " 'gt3r',\n", + " 'orbit_info',\n", + " 'quality_assessment']" + ] + }, + "execution_count": 19, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "atl08_file = h5py.File(data,'r')\n", + "list(atl08_file.keys())" + ] + }, + { + "cell_type": "markdown", + "id": "61a5f601-319a-4836-915d-61ded1d08877", + "metadata": {}, + "source": [ + "Use the `H5glance` module to interactively check all available variables and fields that can be used for further analysis and visualizations:" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "639bb2f9-2793-4fda-a803-d1a4cdf139c7", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "data": { + "text/html": [ + "
                                                                        • atl08_region [📋]: 1 entries, dtype: int32
                                                                        • bin_size_h [📋]: 1 entries, dtype: float32
                                                                        • bin_size_n [📋]: 1 entries, dtype: int32
                                                                        • bright_thresh [📋]: 1 entries, dtype: float32
                                                                        • ca_class [📋]: 1 entries, dtype: int32
                                                                        • can_noise_thresh [📋]: 1 entries, dtype: int32
                                                                        • can_stat_thresh [📋]: 1 entries, dtype: float32
                                                                        • canopy20m_thresh [📋]: 1 entries, dtype: int32
                                                                        • canopy_flag_switch [📋]: 1 entries, dtype: int32
                                                                        • canopy_seg [📋]: 1 entries, dtype: int32
                                                                        • class_thresh [📋]: 1 entries, dtype: int32
                                                                        • cloud_filter_switch [📋]: 1 entries, dtype: int32
                                                                        • del_amp [📋]: 1 entries, dtype: float32
                                                                        • del_mu [📋]: 1 entries, dtype: float32
                                                                        • del_sigma [📋]: 1 entries, dtype: float32
                                                                        • dem_filter_switch [📋]: 1 entries, dtype: int32
                                                                        • dem_removal_percent_limit [📋]: 1 entries, dtype: float32
                                                                        • dragann_switch [📋]: 1 entries, dtype: int32
                                                                        • dseg [📋]: 1 entries, dtype: int32
                                                                        • dseg_buf [📋]: 1 entries, dtype: int32
                                                                        • fnlgnd_filter_switch [📋]: 1 entries, dtype: int32
                                                                        • gnd_stat_thresh [📋]: 1 entries, dtype: float32
                                                                        • gthresh_factor [📋]: 1 entries, dtype: float32
                                                                        • h_canopy_perc [📋]: 1 entries, dtype: float32
                                                                        • iter_gnd [📋]: 1 entries, dtype: int32
                                                                        • iter_max [📋]: 1 entries, dtype: int32
                                                                        • lseg [📋]: 1 entries, dtype: int32
                                                                        • lseg_buf [📋]: 1 entries, dtype: int32
                                                                        • lw_filt_bnd [📋]: 1 entries, dtype: int32
                                                                        • lw_gnd_bnd [📋]: 1 entries, dtype: float32
                                                                        • lw_toc_bnd [📋]: 1 entries, dtype: float32
                                                                        • lw_toc_cut [📋]: 1 entries, dtype: float32
                                                                        • max_atl03files [📋]: 1 entries, dtype: int32
                                                                        • max_atl09files [📋]: 1 entries, dtype: int32
                                                                        • max_peaks [📋]: 1 entries, dtype: int32
                                                                        • max_try [📋]: 1 entries, dtype: int32
                                                                        • min_nphs [📋]: 1 entries, dtype: int32
                                                                        • n_dec_mode [📋]: 1 entries, dtype: int32
                                                                        • night_thresh [📋]: 1 entries, dtype: float32
                                                                        • noise_class [📋]: 1 entries, dtype: int32
                                                                        • outlier_filter_switch [📋]: 1 entries, dtype: int32
                                                                        • p_static [📋]: 1 entries, dtype: float32
                                                                        • ph_removal_percent_limit [📋]: 1 entries, dtype: float32
                                                                        • proc_geoseg [📋]: 1 entries, dtype: int32
                                                                        • psf [📋]: 1 entries, dtype: float32
                                                                        • ref_dem_limit [📋]: 1 entries, dtype: float32
                                                                        • ref_finalground_limit [📋]: 1 entries, dtype: float32
                                                                        • relief_hbot [📋]: 1 entries, dtype: float32
                                                                        • relief_htop [📋]: 1 entries, dtype: float32
                                                                        • shp_param [📋]: 1 entries, dtype: float32
                                                                        • sig_rsq_search [📋]: 1 entries, dtype: float32
                                                                        • sseg [📋]: 1 entries, dtype: float32
                                                                        • stat20m_thresh [📋]: 1 entries, dtype: int32
                                                                        • stat_thresh [📋]: 1 entries, dtype: int32
                                                                        • tc_thresh [📋]: 1 entries, dtype: float32
                                                                        • te_class [📋]: 1 entries, dtype: int32
                                                                        • terrain20m_thresh [📋]: 1 entries, dtype: int32
                                                                        • toc_class [📋]: 1 entries, dtype: int32
                                                                        • up_filt_bnd [📋]: 1 entries, dtype: int32
                                                                        • up_gnd_bnd [📋]: 1 entries, dtype: float32
                                                                        • up_toc_bnd [📋]: 1 entries, dtype: float32
                                                                        • up_toc_cut [📋]: 1 entries, dtype: float32
                                                                        • yapc_switch [📋]: 1 entries, dtype: int32
                                                                      • atlas_sdp_gps_epoch [📋]: 1 entries, dtype: float64
                                                                      • control [📋]: 1 entries, dtype: 100000-byte ASCII string
                                                                      • data_end_utc [📋]: 1 entries, dtype: 27-byte ASCII string
                                                                      • data_start_utc [📋]: 1 entries, dtype: 27-byte ASCII string
                                                                      • end_cycle [📋]: 1 entries, dtype: int32
                                                                      • end_delta_time [📋]: 1 entries, dtype: float64
                                                                      • end_geoseg [📋]: 1 entries, dtype: int32
                                                                      • end_gpssow [📋]: 1 entries, dtype: float64
                                                                      • end_gpsweek [📋]: 1 entries, dtype: int32
                                                                      • end_orbit [📋]: 1 entries, dtype: int32
                                                                      • end_region [📋]: 1 entries, dtype: int32
                                                                      • end_rgt [📋]: 1 entries, dtype: int32
                                                                      • granule_end_utc [📋]: 1 entries, dtype: 27-byte ASCII string
                                                                      • granule_start_utc [📋]: 1 entries, dtype: 27-byte ASCII string
                                                                      • qa_at_interval [📋]: 1 entries, dtype: float64
                                                                      • release [📋]: 1 entries, dtype: 80-byte ASCII string
                                                                      • start_cycle [📋]: 1 entries, dtype: int32
                                                                      • start_delta_time [📋]: 1 entries, dtype: float64
                                                                      • start_geoseg [📋]: 1 entries, dtype: int32
                                                                      • start_gpssow [📋]: 1 entries, dtype: float64
                                                                      • start_gpsweek [📋]: 1 entries, dtype: int32
                                                                      • start_orbit [📋]: 1 entries, dtype: int32
                                                                      • start_region [📋]: 1 entries, dtype: int32
                                                                      • start_rgt [📋]: 1 entries, dtype: int32
                                                                      • version [📋]: 1 entries, dtype: 80-byte ASCII string
                                                                          • can_noise [📋]: 18690 entries, dtype: float32
                                                                          • canopy_h_metrics [📋]: 18690 × 18 entries, dtype: float32
                                                                          • canopy_h_metrics_abs [📋]: 18690 × 18 entries, dtype: float32
                                                                          • canopy_openness [📋]: 18690 entries, dtype: float32
                                                                          • canopy_rh_conf [📋]: 18690 entries, dtype: int8
                                                                          • centroid_height [📋]: 18690 entries, dtype: float32
                                                                          • h_canopy [📋]: 18690 entries, dtype: float32
                                                                          • h_canopy_20m [📋]: 18690 × 5 entries, dtype: float32
                                                                          • h_canopy_abs [📋]: 18690 entries, dtype: float32
                                                                          • h_canopy_quad [📋]: 18690 entries, dtype: float32
                                                                          • h_canopy_uncertainty [📋]: 18690 entries, dtype: float32
                                                                          • h_dif_canopy [📋]: 18690 entries, dtype: float32
                                                                          • h_max_canopy [📋]: 18690 entries, dtype: float32
                                                                          • h_max_canopy_abs [📋]: 18690 entries, dtype: float32
                                                                          • h_mean_canopy [📋]: 18690 entries, dtype: float32
                                                                          • h_mean_canopy_abs [📋]: 18690 entries, dtype: float32
                                                                          • h_median_canopy [📋]: 18690 entries, dtype: float32
                                                                          • h_median_canopy_abs [📋]: 18690 entries, dtype: float32
                                                                          • h_min_canopy [📋]: 18690 entries, dtype: float32
                                                                          • h_min_canopy_abs [📋]: 18690 entries, dtype: float32
                                                                          • n_ca_photons [📋]: 18690 entries, dtype: int32
                                                                          • n_toc_photons [📋]: 18690 entries, dtype: int32
                                                                          • photon_rate_can [📋]: 18690 entries, dtype: float32
                                                                          • photon_rate_can_nr [📋]: 18690 entries, dtype: float32
                                                                          • segment_cover [📋]: 18690 entries, dtype: int16
                                                                          • subset_can_flag [📋]: 18690 × 5 entries, dtype: int8
                                                                          • toc_roughness [📋]: 18690 entries, dtype: float32
                                                                          • h_te_best_fit [📋]: 18690 entries, dtype: float32
                                                                          • h_te_best_fit_20m [📋]: 18690 × 5 entries, dtype: float32
                                                                          • h_te_interp [📋]: 18690 entries, dtype: float32
                                                                          • h_te_max [📋]: 18690 entries, dtype: float32
                                                                          • h_te_mean [📋]: 18690 entries, dtype: float32
                                                                          • h_te_median [📋]: 18690 entries, dtype: float32
                                                                          • h_te_min [📋]: 18690 entries, dtype: float32
                                                                          • h_te_mode [📋]: 18690 entries, dtype: float32
                                                                          • h_te_rh25 [📋]: 18690 entries, dtype: float32
                                                                          • h_te_skew [📋]: 18690 entries, dtype: float32
                                                                          • h_te_std [📋]: 18690 entries, dtype: float32
                                                                          • h_te_uncertainty [📋]: 18690 entries, dtype: float32
                                                                          • n_te_photons [📋]: 18690 entries, dtype: int32
                                                                          • photon_rate_te [📋]: 18690 entries, dtype: float32
                                                                          • subset_te_flag [📋]: 18690 × 5 entries, dtype: int8
                                                                          • terrain_slope [📋]: 18690 entries, dtype: float32
                                                                        • asr [📋]: 18690 entries, dtype: float32
                                                                        • atlas_pa [📋]: 18690 entries, dtype: float32
                                                                        • beam_azimuth [📋]: 18690 entries, dtype: float32
                                                                        • beam_coelev [📋]: 18690 entries, dtype: float32
                                                                        • brightness_flag [📋]: 18690 entries, dtype: int8
                                                                        • cloud_flag_atm [📋]: 18690 entries, dtype: int8
                                                                        • cloud_fold_flag [📋]: 18690 entries, dtype: int8
                                                                        • delta_time [📋]: 18690 entries, dtype: float64
                                                                        • delta_time_beg [📋]: 18690 entries, dtype: float64
                                                                        • delta_time_end [📋]: 18690 entries, dtype: float64
                                                                        • dem_flag [📋]: 18690 entries, dtype: int8
                                                                        • dem_h [📋]: 18690 entries, dtype: float32
                                                                        • dem_removal_flag [📋]: 18690 entries, dtype: int8
                                                                        • h_dif_ref [📋]: 18690 entries, dtype: float32
                                                                        • last_seg_extend [📋]: 18690 entries, dtype: float32
                                                                        • latitude [📋]: 18690 entries, dtype: float32
                                                                        • latitude_20m [📋]: 18690 × 5 entries, dtype: float32
                                                                        • layer_flag [📋]: 18690 entries, dtype: int8
                                                                        • longitude [📋]: 18690 entries, dtype: float32
                                                                        • longitude_20m [📋]: 18690 × 5 entries, dtype: float32
                                                                        • msw_flag [📋]: 18690 entries, dtype: int8
                                                                        • n_seg_ph [📋]: 18690 entries, dtype: int32
                                                                        • night_flag [📋]: 18690 entries, dtype: int32
                                                                        • ph_ndx_beg [📋]: 18690 entries, dtype: int64
                                                                        • ph_removal_flag [📋]: 18690 entries, dtype: int8
                                                                        • psf_flag [📋]: 18690 entries, dtype: int8
                                                                        • rgt [📋]: 18690 entries, dtype: int16
                                                                        • sat_flag [📋]: 18690 entries, dtype: int8
                                                                        • segment_id_beg [📋]: 18690 entries, dtype: int32
                                                                        • segment_id_end [📋]: 18690 entries, dtype: int32
                                                                        • segment_landcover [📋]: 18690 entries, dtype: int16
                                                                        • segment_snowcover [📋]: 18690 entries, dtype: int8
                                                                        • segment_watermask [📋]: 18690 entries, dtype: int32
                                                                        • sigma_across [📋]: 18690 entries, dtype: float32
                                                                        • sigma_along [📋]: 18690 entries, dtype: float32
                                                                        • sigma_atlas_land [📋]: 18690 entries, dtype: float32
                                                                        • sigma_h [📋]: 18690 entries, dtype: float32
                                                                        • sigma_topo [📋]: 18690 entries, dtype: float32
                                                                        • snr [📋]: 18690 entries, dtype: float32
                                                                        • solar_azimuth [📋]: 18690 entries, dtype: float32
                                                                        • solar_elevation [📋]: 18690 entries, dtype: float32
                                                                        • surf_type [📋]: 18690 × 5 entries, dtype: int8
                                                                        • terrain_flg [📋]: 18690 entries, dtype: int32
                                                                        • urban_flag [📋]: 18690 entries, dtype: int32
                                                                        • classed_pc_flag [📋]: 4876093 entries, dtype: int8
                                                                        • classed_pc_indx [📋]: 4876093 entries, dtype: int32
                                                                        • d_flag [📋]: 4876093 entries, dtype: int8
                                                                        • delta_time [📋]: 4876093 entries, dtype: float64
                                                                        • ph_h [📋]: 4876093 entries, dtype: float32
                                                                        • ph_segment_id [📋]: 4876093 entries, dtype: int32
                                                                          • can_noise [📋]: 11436 entries, dtype: float32
                                                                          • canopy_h_metrics [📋]: 11436 × 18 entries, dtype: float32
                                                                          • canopy_h_metrics_abs [📋]: 11436 × 18 entries, dtype: float32
                                                                          • canopy_openness [📋]: 11436 entries, dtype: float32
                                                                          • canopy_rh_conf [📋]: 11436 entries, dtype: int8
                                                                          • centroid_height [📋]: 11436 entries, dtype: float32
                                                                          • h_canopy [📋]: 11436 entries, dtype: float32
                                                                          • h_canopy_20m [📋]: 11436 × 5 entries, dtype: float32
                                                                          • h_canopy_abs [📋]: 11436 entries, dtype: float32
                                                                          • h_canopy_quad [📋]: 11436 entries, dtype: float32
                                                                          • h_canopy_uncertainty [📋]: 11436 entries, dtype: float32
                                                                          • h_dif_canopy [📋]: 11436 entries, dtype: float32
                                                                          • h_max_canopy [📋]: 11436 entries, dtype: float32
                                                                          • h_max_canopy_abs [📋]: 11436 entries, dtype: float32
                                                                          • h_mean_canopy [📋]: 11436 entries, dtype: float32
                                                                          • h_mean_canopy_abs [📋]: 11436 entries, dtype: float32
                                                                          • h_median_canopy [📋]: 11436 entries, dtype: float32
                                                                          • h_median_canopy_abs [📋]: 11436 entries, dtype: float32
                                                                          • h_min_canopy [📋]: 11436 entries, dtype: float32
                                                                          • h_min_canopy_abs [📋]: 11436 entries, dtype: float32
                                                                          • n_ca_photons [📋]: 11436 entries, dtype: int32
                                                                          • n_toc_photons [📋]: 11436 entries, dtype: int32
                                                                          • photon_rate_can [📋]: 11436 entries, dtype: float32
                                                                          • photon_rate_can_nr [📋]: 11436 entries, dtype: float32
                                                                          • segment_cover [📋]: 11436 entries, dtype: int16
                                                                          • subset_can_flag [📋]: 11436 × 5 entries, dtype: int8
                                                                          • toc_roughness [📋]: 11436 entries, dtype: float32
                                                                          • h_te_best_fit [📋]: 11436 entries, dtype: float32
                                                                          • h_te_best_fit_20m [📋]: 11436 × 5 entries, dtype: float32
                                                                          • h_te_interp [📋]: 11436 entries, dtype: float32
                                                                          • h_te_max [📋]: 11436 entries, dtype: float32
                                                                          • h_te_mean [📋]: 11436 entries, dtype: float32
                                                                          • h_te_median [📋]: 11436 entries, dtype: float32
                                                                          • h_te_min [📋]: 11436 entries, dtype: float32
                                                                          • h_te_mode [📋]: 11436 entries, dtype: float32
                                                                          • h_te_rh25 [📋]: 11436 entries, dtype: float32
                                                                          • h_te_skew [📋]: 11436 entries, dtype: float32
                                                                          • h_te_std [📋]: 11436 entries, dtype: float32
                                                                          • h_te_uncertainty [📋]: 11436 entries, dtype: float32
                                                                          • n_te_photons [📋]: 11436 entries, dtype: int32
                                                                          • photon_rate_te [📋]: 11436 entries, dtype: float32
                                                                          • subset_te_flag [📋]: 11436 × 5 entries, dtype: int8
                                                                          • terrain_slope [📋]: 11436 entries, dtype: float32
                                                                        • asr [📋]: 11436 entries, dtype: float32
                                                                        • atlas_pa [📋]: 11436 entries, dtype: float32
                                                                        • beam_azimuth [📋]: 11436 entries, dtype: float32
                                                                        • beam_coelev [📋]: 11436 entries, dtype: float32
                                                                        • brightness_flag [📋]: 11436 entries, dtype: int8
                                                                        • cloud_flag_atm [📋]: 11436 entries, dtype: int8
                                                                        • cloud_fold_flag [📋]: 11436 entries, dtype: int8
                                                                        • delta_time [📋]: 11436 entries, dtype: float64
                                                                        • delta_time_beg [📋]: 11436 entries, dtype: float64
                                                                        • delta_time_end [📋]: 11436 entries, dtype: float64
                                                                        • dem_flag [📋]: 11436 entries, dtype: int8
                                                                        • dem_h [📋]: 11436 entries, dtype: float32
                                                                        • dem_removal_flag [📋]: 11436 entries, dtype: int8
                                                                        • h_dif_ref [📋]: 11436 entries, dtype: float32
                                                                        • last_seg_extend [📋]: 11436 entries, dtype: float32
                                                                        • latitude [📋]: 11436 entries, dtype: float32
                                                                        • latitude_20m [📋]: 11436 × 5 entries, dtype: float32
                                                                        • layer_flag [📋]: 11436 entries, dtype: int8
                                                                        • longitude [📋]: 11436 entries, dtype: float32
                                                                        • longitude_20m [📋]: 11436 × 5 entries, dtype: float32
                                                                        • msw_flag [📋]: 11436 entries, dtype: int8
                                                                        • n_seg_ph [📋]: 11436 entries, dtype: int32
                                                                        • night_flag [📋]: 11436 entries, dtype: int32
                                                                        • ph_ndx_beg [📋]: 11436 entries, dtype: int64
                                                                        • ph_removal_flag [📋]: 11436 entries, dtype: int8
                                                                        • psf_flag [📋]: 11436 entries, dtype: int8
                                                                        • rgt [📋]: 11436 entries, dtype: int16
                                                                        • sat_flag [📋]: 11436 entries, dtype: int8
                                                                        • segment_id_beg [📋]: 11436 entries, dtype: int32
                                                                        • segment_id_end [📋]: 11436 entries, dtype: int32
                                                                        • segment_landcover [📋]: 11436 entries, dtype: int16
                                                                        • segment_snowcover [📋]: 11436 entries, dtype: int8
                                                                        • segment_watermask [📋]: 11436 entries, dtype: int32
                                                                        • sigma_across [📋]: 11436 entries, dtype: float32
                                                                        • sigma_along [📋]: 11436 entries, dtype: float32
                                                                        • sigma_atlas_land [📋]: 11436 entries, dtype: float32
                                                                        • sigma_h [📋]: 11436 entries, dtype: float32
                                                                        • sigma_topo [📋]: 11436 entries, dtype: float32
                                                                        • snr [📋]: 11436 entries, dtype: float32
                                                                        • solar_azimuth [📋]: 11436 entries, dtype: float32
                                                                        • solar_elevation [📋]: 11436 entries, dtype: float32
                                                                        • surf_type [📋]: 11436 × 5 entries, dtype: int8
                                                                        • terrain_flg [📋]: 11436 entries, dtype: int32
                                                                        • urban_flag [📋]: 11436 entries, dtype: int32
                                                                        • classed_pc_flag [📋]: 1372978 entries, dtype: int8
                                                                        • classed_pc_indx [📋]: 1372978 entries, dtype: int32
                                                                        • d_flag [📋]: 1372978 entries, dtype: int8
                                                                        • delta_time [📋]: 1372978 entries, dtype: float64
                                                                        • ph_h [📋]: 1372978 entries, dtype: float32
                                                                        • ph_segment_id [📋]: 1372978 entries, dtype: int32
                                                                          • can_noise [📋]: 18612 entries, dtype: float32
                                                                          • canopy_h_metrics [📋]: 18612 × 18 entries, dtype: float32
                                                                          • canopy_h_metrics_abs [📋]: 18612 × 18 entries, dtype: float32
                                                                          • canopy_openness [📋]: 18612 entries, dtype: float32
                                                                          • canopy_rh_conf [📋]: 18612 entries, dtype: int8
                                                                          • centroid_height [📋]: 18612 entries, dtype: float32
                                                                          • h_canopy [📋]: 18612 entries, dtype: float32
                                                                          • h_canopy_20m [📋]: 18612 × 5 entries, dtype: float32
                                                                          • h_canopy_abs [📋]: 18612 entries, dtype: float32
                                                                          • h_canopy_quad [📋]: 18612 entries, dtype: float32
                                                                          • h_canopy_uncertainty [📋]: 18612 entries, dtype: float32
                                                                          • h_dif_canopy [📋]: 18612 entries, dtype: float32
                                                                          • h_max_canopy [📋]: 18612 entries, dtype: float32
                                                                          • h_max_canopy_abs [📋]: 18612 entries, dtype: float32
                                                                          • h_mean_canopy [📋]: 18612 entries, dtype: float32
                                                                          • h_mean_canopy_abs [📋]: 18612 entries, dtype: float32
                                                                          • h_median_canopy [📋]: 18612 entries, dtype: float32
                                                                          • h_median_canopy_abs [📋]: 18612 entries, dtype: float32
                                                                          • h_min_canopy [📋]: 18612 entries, dtype: float32
                                                                          • h_min_canopy_abs [📋]: 18612 entries, dtype: float32
                                                                          • n_ca_photons [📋]: 18612 entries, dtype: int32
                                                                          • n_toc_photons [📋]: 18612 entries, dtype: int32
                                                                          • photon_rate_can [📋]: 18612 entries, dtype: float32
                                                                          • photon_rate_can_nr [📋]: 18612 entries, dtype: float32
                                                                          • segment_cover [📋]: 18612 entries, dtype: int16
                                                                          • subset_can_flag [📋]: 18612 × 5 entries, dtype: int8
                                                                          • toc_roughness [📋]: 18612 entries, dtype: float32
                                                                          • h_te_best_fit [📋]: 18612 entries, dtype: float32
                                                                          • h_te_best_fit_20m [📋]: 18612 × 5 entries, dtype: float32
                                                                          • h_te_interp [📋]: 18612 entries, dtype: float32
                                                                          • h_te_max [📋]: 18612 entries, dtype: float32
                                                                          • h_te_mean [📋]: 18612 entries, dtype: float32
                                                                          • h_te_median [📋]: 18612 entries, dtype: float32
                                                                          • h_te_min [📋]: 18612 entries, dtype: float32
                                                                          • h_te_mode [📋]: 18612 entries, dtype: float32
                                                                          • h_te_rh25 [📋]: 18612 entries, dtype: float32
                                                                          • h_te_skew [📋]: 18612 entries, dtype: float32
                                                                          • h_te_std [📋]: 18612 entries, dtype: float32
                                                                          • h_te_uncertainty [📋]: 18612 entries, dtype: float32
                                                                          • n_te_photons [📋]: 18612 entries, dtype: int32
                                                                          • photon_rate_te [📋]: 18612 entries, dtype: float32
                                                                          • subset_te_flag [📋]: 18612 × 5 entries, dtype: int8
                                                                          • terrain_slope [📋]: 18612 entries, dtype: float32
                                                                        • asr [📋]: 18612 entries, dtype: float32
                                                                        • atlas_pa [📋]: 18612 entries, dtype: float32
                                                                        • beam_azimuth [📋]: 18612 entries, dtype: float32
                                                                        • beam_coelev [📋]: 18612 entries, dtype: float32
                                                                        • brightness_flag [📋]: 18612 entries, dtype: int8
                                                                        • cloud_flag_atm [📋]: 18612 entries, dtype: int8
                                                                        • cloud_fold_flag [📋]: 18612 entries, dtype: int8
                                                                        • delta_time [📋]: 18612 entries, dtype: float64
                                                                        • delta_time_beg [📋]: 18612 entries, dtype: float64
                                                                        • delta_time_end [📋]: 18612 entries, dtype: float64
                                                                        • dem_flag [📋]: 18612 entries, dtype: int8
                                                                        • dem_h [📋]: 18612 entries, dtype: float32
                                                                        • dem_removal_flag [📋]: 18612 entries, dtype: int8
                                                                        • h_dif_ref [📋]: 18612 entries, dtype: float32
                                                                        • last_seg_extend [📋]: 18612 entries, dtype: float32
                                                                        • latitude [📋]: 18612 entries, dtype: float32
                                                                        • latitude_20m [📋]: 18612 × 5 entries, dtype: float32
                                                                        • layer_flag [📋]: 18612 entries, dtype: int8
                                                                        • longitude [📋]: 18612 entries, dtype: float32
                                                                        • longitude_20m [📋]: 18612 × 5 entries, dtype: float32
                                                                        • msw_flag [📋]: 18612 entries, dtype: int8
                                                                        • n_seg_ph [📋]: 18612 entries, dtype: int32
                                                                        • night_flag [📋]: 18612 entries, dtype: int32
                                                                        • ph_ndx_beg [📋]: 18612 entries, dtype: int64
                                                                        • ph_removal_flag [📋]: 18612 entries, dtype: int8
                                                                        • psf_flag [📋]: 18612 entries, dtype: int8
                                                                        • rgt [📋]: 18612 entries, dtype: int16
                                                                        • sat_flag [📋]: 18612 entries, dtype: int8
                                                                        • segment_id_beg [📋]: 18612 entries, dtype: int32
                                                                        • segment_id_end [📋]: 18612 entries, dtype: int32
                                                                        • segment_landcover [📋]: 18612 entries, dtype: int16
                                                                        • segment_snowcover [📋]: 18612 entries, dtype: int8
                                                                        • segment_watermask [📋]: 18612 entries, dtype: int32
                                                                        • sigma_across [📋]: 18612 entries, dtype: float32
                                                                        • sigma_along [📋]: 18612 entries, dtype: float32
                                                                        • sigma_atlas_land [📋]: 18612 entries, dtype: float32
                                                                        • sigma_h [📋]: 18612 entries, dtype: float32
                                                                        • sigma_topo [📋]: 18612 entries, dtype: float32
                                                                        • snr [📋]: 18612 entries, dtype: float32
                                                                        • solar_azimuth [📋]: 18612 entries, dtype: float32
                                                                        • solar_elevation [📋]: 18612 entries, dtype: float32
                                                                        • surf_type [📋]: 18612 × 5 entries, dtype: int8
                                                                        • terrain_flg [📋]: 18612 entries, dtype: int32
                                                                        • urban_flag [📋]: 18612 entries, dtype: int32
                                                                        • classed_pc_flag [📋]: 3117451 entries, dtype: int8
                                                                        • classed_pc_indx [📋]: 3117451 entries, dtype: int32
                                                                        • d_flag [📋]: 3117451 entries, dtype: int8
                                                                        • delta_time [📋]: 3117451 entries, dtype: float64
                                                                        • ph_h [📋]: 3117451 entries, dtype: float32
                                                                        • ph_segment_id [📋]: 3117451 entries, dtype: int32
                                                                          • can_noise [📋]: 10243 entries, dtype: float32
                                                                          • canopy_h_metrics [📋]: 10243 × 18 entries, dtype: float32
                                                                          • canopy_h_metrics_abs [📋]: 10243 × 18 entries, dtype: float32
                                                                          • canopy_openness [📋]: 10243 entries, dtype: float32
                                                                          • canopy_rh_conf [📋]: 10243 entries, dtype: int8
                                                                          • centroid_height [📋]: 10243 entries, dtype: float32
                                                                          • h_canopy [📋]: 10243 entries, dtype: float32
                                                                          • h_canopy_20m [📋]: 10243 × 5 entries, dtype: float32
                                                                          • h_canopy_abs [📋]: 10243 entries, dtype: float32
                                                                          • h_canopy_quad [📋]: 10243 entries, dtype: float32
                                                                          • h_canopy_uncertainty [📋]: 10243 entries, dtype: float32
                                                                          • h_dif_canopy [📋]: 10243 entries, dtype: float32
                                                                          • h_max_canopy [📋]: 10243 entries, dtype: float32
                                                                          • h_max_canopy_abs [📋]: 10243 entries, dtype: float32
                                                                          • h_mean_canopy [📋]: 10243 entries, dtype: float32
                                                                          • h_mean_canopy_abs [📋]: 10243 entries, dtype: float32
                                                                          • h_median_canopy [📋]: 10243 entries, dtype: float32
                                                                          • h_median_canopy_abs [📋]: 10243 entries, dtype: float32
                                                                          • h_min_canopy [📋]: 10243 entries, dtype: float32
                                                                          • h_min_canopy_abs [📋]: 10243 entries, dtype: float32
                                                                          • n_ca_photons [📋]: 10243 entries, dtype: int32
                                                                          • n_toc_photons [📋]: 10243 entries, dtype: int32
                                                                          • photon_rate_can [📋]: 10243 entries, dtype: float32
                                                                          • photon_rate_can_nr [📋]: 10243 entries, dtype: float32
                                                                          • segment_cover [📋]: 10243 entries, dtype: int16
                                                                          • subset_can_flag [📋]: 10243 × 5 entries, dtype: int8
                                                                          • toc_roughness [📋]: 10243 entries, dtype: float32
                                                                          • h_te_best_fit [📋]: 10243 entries, dtype: float32
                                                                          • h_te_best_fit_20m [📋]: 10243 × 5 entries, dtype: float32
                                                                          • h_te_interp [📋]: 10243 entries, dtype: float32
                                                                          • h_te_max [📋]: 10243 entries, dtype: float32
                                                                          • h_te_mean [📋]: 10243 entries, dtype: float32
                                                                          • h_te_median [📋]: 10243 entries, dtype: float32
                                                                          • h_te_min [📋]: 10243 entries, dtype: float32
                                                                          • h_te_mode [📋]: 10243 entries, dtype: float32
                                                                          • h_te_rh25 [📋]: 10243 entries, dtype: float32
                                                                          • h_te_skew [📋]: 10243 entries, dtype: float32
                                                                          • h_te_std [📋]: 10243 entries, dtype: float32
                                                                          • h_te_uncertainty [📋]: 10243 entries, dtype: float32
                                                                          • n_te_photons [📋]: 10243 entries, dtype: int32
                                                                          • photon_rate_te [📋]: 10243 entries, dtype: float32
                                                                          • subset_te_flag [📋]: 10243 × 5 entries, dtype: int8
                                                                          • terrain_slope [📋]: 10243 entries, dtype: float32
                                                                        • asr [📋]: 10243 entries, dtype: float32
                                                                        • atlas_pa [📋]: 10243 entries, dtype: float32
                                                                        • beam_azimuth [📋]: 10243 entries, dtype: float32
                                                                        • beam_coelev [📋]: 10243 entries, dtype: float32
                                                                        • brightness_flag [📋]: 10243 entries, dtype: int8
                                                                        • cloud_flag_atm [📋]: 10243 entries, dtype: int8
                                                                        • cloud_fold_flag [📋]: 10243 entries, dtype: int8
                                                                        • delta_time [📋]: 10243 entries, dtype: float64
                                                                        • delta_time_beg [📋]: 10243 entries, dtype: float64
                                                                        • delta_time_end [📋]: 10243 entries, dtype: float64
                                                                        • dem_flag [📋]: 10243 entries, dtype: int8
                                                                        • dem_h [📋]: 10243 entries, dtype: float32
                                                                        • dem_removal_flag [📋]: 10243 entries, dtype: int8
                                                                        • h_dif_ref [📋]: 10243 entries, dtype: float32
                                                                        • last_seg_extend [📋]: 10243 entries, dtype: float32
                                                                        • latitude [📋]: 10243 entries, dtype: float32
                                                                        • latitude_20m [📋]: 10243 × 5 entries, dtype: float32
                                                                        • layer_flag [📋]: 10243 entries, dtype: int8
                                                                        • longitude [📋]: 10243 entries, dtype: float32
                                                                        • longitude_20m [📋]: 10243 × 5 entries, dtype: float32
                                                                        • msw_flag [📋]: 10243 entries, dtype: int8
                                                                        • n_seg_ph [📋]: 10243 entries, dtype: int32
                                                                        • night_flag [📋]: 10243 entries, dtype: int32
                                                                        • ph_ndx_beg [📋]: 10243 entries, dtype: int64
                                                                        • ph_removal_flag [📋]: 10243 entries, dtype: int8
                                                                        • psf_flag [📋]: 10243 entries, dtype: int8
                                                                        • rgt [📋]: 10243 entries, dtype: int16
                                                                        • sat_flag [📋]: 10243 entries, dtype: int8
                                                                        • segment_id_beg [📋]: 10243 entries, dtype: int32
                                                                        • segment_id_end [📋]: 10243 entries, dtype: int32
                                                                        • segment_landcover [📋]: 10243 entries, dtype: int16
                                                                        • segment_snowcover [📋]: 10243 entries, dtype: int8
                                                                        • segment_watermask [📋]: 10243 entries, dtype: int32
                                                                        • sigma_across [📋]: 10243 entries, dtype: float32
                                                                        • sigma_along [📋]: 10243 entries, dtype: float32
                                                                        • sigma_atlas_land [📋]: 10243 entries, dtype: float32
                                                                        • sigma_h [📋]: 10243 entries, dtype: float32
                                                                        • sigma_topo [📋]: 10243 entries, dtype: float32
                                                                        • snr [📋]: 10243 entries, dtype: float32
                                                                        • solar_azimuth [📋]: 10243 entries, dtype: float32
                                                                        • solar_elevation [📋]: 10243 entries, dtype: float32
                                                                        • surf_type [📋]: 10243 × 5 entries, dtype: int8
                                                                        • terrain_flg [📋]: 10243 entries, dtype: int32
                                                                        • urban_flag [📋]: 10243 entries, dtype: int32
                                                                        • classed_pc_flag [📋]: 1107244 entries, dtype: int8
                                                                        • classed_pc_indx [📋]: 1107244 entries, dtype: int32
                                                                        • d_flag [📋]: 1107244 entries, dtype: int8
                                                                        • delta_time [📋]: 1107244 entries, dtype: float64
                                                                        • ph_h [📋]: 1107244 entries, dtype: float32
                                                                        • ph_segment_id [📋]: 1107244 entries, dtype: int32
                                                                          • can_noise [📋]: 19575 entries, dtype: float32
                                                                          • canopy_h_metrics [📋]: 19575 × 18 entries, dtype: float32
                                                                          • canopy_h_metrics_abs [📋]: 19575 × 18 entries, dtype: float32
                                                                          • canopy_openness [📋]: 19575 entries, dtype: float32
                                                                          • canopy_rh_conf [📋]: 19575 entries, dtype: int8
                                                                          • centroid_height [📋]: 19575 entries, dtype: float32
                                                                          • h_canopy [📋]: 19575 entries, dtype: float32
                                                                          • h_canopy_20m [📋]: 19575 × 5 entries, dtype: float32
                                                                          • h_canopy_abs [📋]: 19575 entries, dtype: float32
                                                                          • h_canopy_quad [📋]: 19575 entries, dtype: float32
                                                                          • h_canopy_uncertainty [📋]: 19575 entries, dtype: float32
                                                                          • h_dif_canopy [📋]: 19575 entries, dtype: float32
                                                                          • h_max_canopy [📋]: 19575 entries, dtype: float32
                                                                          • h_max_canopy_abs [📋]: 19575 entries, dtype: float32
                                                                          • h_mean_canopy [📋]: 19575 entries, dtype: float32
                                                                          • h_mean_canopy_abs [📋]: 19575 entries, dtype: float32
                                                                          • h_median_canopy [📋]: 19575 entries, dtype: float32
                                                                          • h_median_canopy_abs [📋]: 19575 entries, dtype: float32
                                                                          • h_min_canopy [📋]: 19575 entries, dtype: float32
                                                                          • h_min_canopy_abs [📋]: 19575 entries, dtype: float32
                                                                          • n_ca_photons [📋]: 19575 entries, dtype: int32
                                                                          • n_toc_photons [📋]: 19575 entries, dtype: int32
                                                                          • photon_rate_can [📋]: 19575 entries, dtype: float32
                                                                          • photon_rate_can_nr [📋]: 19575 entries, dtype: float32
                                                                          • segment_cover [📋]: 19575 entries, dtype: int16
                                                                          • subset_can_flag [📋]: 19575 × 5 entries, dtype: int8
                                                                          • toc_roughness [📋]: 19575 entries, dtype: float32
                                                                          • h_te_best_fit [📋]: 19575 entries, dtype: float32
                                                                          • h_te_best_fit_20m [📋]: 19575 × 5 entries, dtype: float32
                                                                          • h_te_interp [📋]: 19575 entries, dtype: float32
                                                                          • h_te_max [📋]: 19575 entries, dtype: float32
                                                                          • h_te_mean [📋]: 19575 entries, dtype: float32
                                                                          • h_te_median [📋]: 19575 entries, dtype: float32
                                                                          • h_te_min [📋]: 19575 entries, dtype: float32
                                                                          • h_te_mode [📋]: 19575 entries, dtype: float32
                                                                          • h_te_rh25 [📋]: 19575 entries, dtype: float32
                                                                          • h_te_skew [📋]: 19575 entries, dtype: float32
                                                                          • h_te_std [📋]: 19575 entries, dtype: float32
                                                                          • h_te_uncertainty [📋]: 19575 entries, dtype: float32
                                                                          • n_te_photons [📋]: 19575 entries, dtype: int32
                                                                          • photon_rate_te [📋]: 19575 entries, dtype: float32
                                                                          • subset_te_flag [📋]: 19575 × 5 entries, dtype: int8
                                                                          • terrain_slope [📋]: 19575 entries, dtype: float32
                                                                        • asr [📋]: 19575 entries, dtype: float32
                                                                        • atlas_pa [📋]: 19575 entries, dtype: float32
                                                                        • beam_azimuth [📋]: 19575 entries, dtype: float32
                                                                        • beam_coelev [📋]: 19575 entries, dtype: float32
                                                                        • brightness_flag [📋]: 19575 entries, dtype: int8
                                                                        • cloud_flag_atm [📋]: 19575 entries, dtype: int8
                                                                        • cloud_fold_flag [📋]: 19575 entries, dtype: int8
                                                                        • delta_time [📋]: 19575 entries, dtype: float64
                                                                        • delta_time_beg [📋]: 19575 entries, dtype: float64
                                                                        • delta_time_end [📋]: 19575 entries, dtype: float64
                                                                        • dem_flag [📋]: 19575 entries, dtype: int8
                                                                        • dem_h [📋]: 19575 entries, dtype: float32
                                                                        • dem_removal_flag [📋]: 19575 entries, dtype: int8
                                                                        • h_dif_ref [📋]: 19575 entries, dtype: float32
                                                                        • last_seg_extend [📋]: 19575 entries, dtype: float32
                                                                        • latitude [📋]: 19575 entries, dtype: float32
                                                                        • latitude_20m [📋]: 19575 × 5 entries, dtype: float32
                                                                        • layer_flag [📋]: 19575 entries, dtype: int8
                                                                        • longitude [📋]: 19575 entries, dtype: float32
                                                                        • longitude_20m [📋]: 19575 × 5 entries, dtype: float32
                                                                        • msw_flag [📋]: 19575 entries, dtype: int8
                                                                        • n_seg_ph [📋]: 19575 entries, dtype: int32
                                                                        • night_flag [📋]: 19575 entries, dtype: int32
                                                                        • ph_ndx_beg [📋]: 19575 entries, dtype: int64
                                                                        • ph_removal_flag [📋]: 19575 entries, dtype: int8
                                                                        • psf_flag [📋]: 19575 entries, dtype: int8
                                                                        • rgt [📋]: 19575 entries, dtype: int16
                                                                        • sat_flag [📋]: 19575 entries, dtype: int8
                                                                        • segment_id_beg [📋]: 19575 entries, dtype: int32
                                                                        • segment_id_end [📋]: 19575 entries, dtype: int32
                                                                        • segment_landcover [📋]: 19575 entries, dtype: int16
                                                                        • segment_snowcover [📋]: 19575 entries, dtype: int8
                                                                        • segment_watermask [📋]: 19575 entries, dtype: int32
                                                                        • sigma_across [📋]: 19575 entries, dtype: float32
                                                                        • sigma_along [📋]: 19575 entries, dtype: float32
                                                                        • sigma_atlas_land [📋]: 19575 entries, dtype: float32
                                                                        • sigma_h [📋]: 19575 entries, dtype: float32
                                                                        • sigma_topo [📋]: 19575 entries, dtype: float32
                                                                        • snr [📋]: 19575 entries, dtype: float32
                                                                        • solar_azimuth [📋]: 19575 entries, dtype: float32
                                                                        • solar_elevation [📋]: 19575 entries, dtype: float32
                                                                        • surf_type [📋]: 19575 × 5 entries, dtype: int8
                                                                        • terrain_flg [📋]: 19575 entries, dtype: int32
                                                                        • urban_flag [📋]: 19575 entries, dtype: int32
                                                                        • classed_pc_flag [📋]: 3880512 entries, dtype: int8
                                                                        • classed_pc_indx [📋]: 3880512 entries, dtype: int32
                                                                        • d_flag [📋]: 3880512 entries, dtype: int8
                                                                        • delta_time [📋]: 3880512 entries, dtype: float64
                                                                        • ph_h [📋]: 3880512 entries, dtype: float32
                                                                        • ph_segment_id [📋]: 3880512 entries, dtype: int32
                                                                          • can_noise [📋]: 10803 entries, dtype: float32
                                                                          • canopy_h_metrics [📋]: 10803 × 18 entries, dtype: float32
                                                                          • canopy_h_metrics_abs [📋]: 10803 × 18 entries, dtype: float32
                                                                          • canopy_openness [📋]: 10803 entries, dtype: float32
                                                                          • canopy_rh_conf [📋]: 10803 entries, dtype: int8
                                                                          • centroid_height [📋]: 10803 entries, dtype: float32
                                                                          • h_canopy [📋]: 10803 entries, dtype: float32
                                                                          • h_canopy_20m [📋]: 10803 × 5 entries, dtype: float32
                                                                          • h_canopy_abs [📋]: 10803 entries, dtype: float32
                                                                          • h_canopy_quad [📋]: 10803 entries, dtype: float32
                                                                          • h_canopy_uncertainty [📋]: 10803 entries, dtype: float32
                                                                          • h_dif_canopy [📋]: 10803 entries, dtype: float32
                                                                          • h_max_canopy [📋]: 10803 entries, dtype: float32
                                                                          • h_max_canopy_abs [📋]: 10803 entries, dtype: float32
                                                                          • h_mean_canopy [📋]: 10803 entries, dtype: float32
                                                                          • h_mean_canopy_abs [📋]: 10803 entries, dtype: float32
                                                                          • h_median_canopy [📋]: 10803 entries, dtype: float32
                                                                          • h_median_canopy_abs [📋]: 10803 entries, dtype: float32
                                                                          • h_min_canopy [📋]: 10803 entries, dtype: float32
                                                                          • h_min_canopy_abs [📋]: 10803 entries, dtype: float32
                                                                          • n_ca_photons [📋]: 10803 entries, dtype: int32
                                                                          • n_toc_photons [📋]: 10803 entries, dtype: int32
                                                                          • photon_rate_can [📋]: 10803 entries, dtype: float32
                                                                          • photon_rate_can_nr [📋]: 10803 entries, dtype: float32
                                                                          • segment_cover [📋]: 10803 entries, dtype: int16
                                                                          • subset_can_flag [📋]: 10803 × 5 entries, dtype: int8
                                                                          • toc_roughness [📋]: 10803 entries, dtype: float32
                                                                          • h_te_best_fit [📋]: 10803 entries, dtype: float32
                                                                          • h_te_best_fit_20m [📋]: 10803 × 5 entries, dtype: float32
                                                                          • h_te_interp [📋]: 10803 entries, dtype: float32
                                                                          • h_te_max [📋]: 10803 entries, dtype: float32
                                                                          • h_te_mean [📋]: 10803 entries, dtype: float32
                                                                          • h_te_median [📋]: 10803 entries, dtype: float32
                                                                          • h_te_min [📋]: 10803 entries, dtype: float32
                                                                          • h_te_mode [📋]: 10803 entries, dtype: float32
                                                                          • h_te_rh25 [📋]: 10803 entries, dtype: float32
                                                                          • h_te_skew [📋]: 10803 entries, dtype: float32
                                                                          • h_te_std [📋]: 10803 entries, dtype: float32
                                                                          • h_te_uncertainty [📋]: 10803 entries, dtype: float32
                                                                          • n_te_photons [📋]: 10803 entries, dtype: int32
                                                                          • photon_rate_te [📋]: 10803 entries, dtype: float32
                                                                          • subset_te_flag [📋]: 10803 × 5 entries, dtype: int8
                                                                          • terrain_slope [📋]: 10803 entries, dtype: float32
                                                                        • asr [📋]: 10803 entries, dtype: float32
                                                                        • atlas_pa [📋]: 10803 entries, dtype: float32
                                                                        • beam_azimuth [📋]: 10803 entries, dtype: float32
                                                                        • beam_coelev [📋]: 10803 entries, dtype: float32
                                                                        • brightness_flag [📋]: 10803 entries, dtype: int8
                                                                        • cloud_flag_atm [📋]: 10803 entries, dtype: int8
                                                                        • cloud_fold_flag [📋]: 10803 entries, dtype: int8
                                                                        • delta_time [📋]: 10803 entries, dtype: float64
                                                                        • delta_time_beg [📋]: 10803 entries, dtype: float64
                                                                        • delta_time_end [📋]: 10803 entries, dtype: float64
                                                                        • dem_flag [📋]: 10803 entries, dtype: int8
                                                                        • dem_h [📋]: 10803 entries, dtype: float32
                                                                        • dem_removal_flag [📋]: 10803 entries, dtype: int8
                                                                        • h_dif_ref [📋]: 10803 entries, dtype: float32
                                                                        • last_seg_extend [📋]: 10803 entries, dtype: float32
                                                                        • latitude [📋]: 10803 entries, dtype: float32
                                                                        • latitude_20m [📋]: 10803 × 5 entries, dtype: float32
                                                                        • layer_flag [📋]: 10803 entries, dtype: int8
                                                                        • longitude [📋]: 10803 entries, dtype: float32
                                                                        • longitude_20m [📋]: 10803 × 5 entries, dtype: float32
                                                                        • msw_flag [📋]: 10803 entries, dtype: int8
                                                                        • n_seg_ph [📋]: 10803 entries, dtype: int32
                                                                        • night_flag [📋]: 10803 entries, dtype: int32
                                                                        • ph_ndx_beg [📋]: 10803 entries, dtype: int64
                                                                        • ph_removal_flag [📋]: 10803 entries, dtype: int8
                                                                        • psf_flag [📋]: 10803 entries, dtype: int8
                                                                        • rgt [📋]: 10803 entries, dtype: int16
                                                                        • sat_flag [📋]: 10803 entries, dtype: int8
                                                                        • segment_id_beg [📋]: 10803 entries, dtype: int32
                                                                        • segment_id_end [📋]: 10803 entries, dtype: int32
                                                                        • segment_landcover [📋]: 10803 entries, dtype: int16
                                                                        • segment_snowcover [📋]: 10803 entries, dtype: int8
                                                                        • segment_watermask [📋]: 10803 entries, dtype: int32
                                                                        • sigma_across [📋]: 10803 entries, dtype: float32
                                                                        • sigma_along [📋]: 10803 entries, dtype: float32
                                                                        • sigma_atlas_land [📋]: 10803 entries, dtype: float32
                                                                        • sigma_h [📋]: 10803 entries, dtype: float32
                                                                        • sigma_topo [📋]: 10803 entries, dtype: float32
                                                                        • snr [📋]: 10803 entries, dtype: float32
                                                                        • solar_azimuth [📋]: 10803 entries, dtype: float32
                                                                        • solar_elevation [📋]: 10803 entries, dtype: float32
                                                                        • surf_type [📋]: 10803 × 5 entries, dtype: int8
                                                                        • terrain_flg [📋]: 10803 entries, dtype: int32
                                                                        • urban_flag [📋]: 10803 entries, dtype: int32
                                                                        • classed_pc_flag [📋]: 1146212 entries, dtype: int8
                                                                        • classed_pc_indx [📋]: 1146212 entries, dtype: int32
                                                                        • d_flag [📋]: 1146212 entries, dtype: int8
                                                                        • delta_time [📋]: 1146212 entries, dtype: float64
                                                                        • ph_h [📋]: 1146212 entries, dtype: float32
                                                                        • ph_segment_id [📋]: 1146212 entries, dtype: int32
                                                                      • bounding_polygon_lat1 [📋]: 11 entries, dtype: float64
                                                                      • bounding_polygon_lon1 [📋]: 11 entries, dtype: float64
                                                                      • crossing_time [📋]: 1 entries, dtype: float64
                                                                      • cycle_number [📋]: 1 entries, dtype: int8
                                                                      • lan [📋]: 1 entries, dtype: float64
                                                                      • orbit_number [📋]: 1 entries, dtype: uint16
                                                                      • rgt [📋]: 1 entries, dtype: int16
                                                                      • sc_orient [📋]: 1 entries, dtype: int8
                                                                      • sc_orient_time [📋]: 1 entries, dtype: float64
                                                                      • qa_granule_fail_reason [📋]: 1 entries, dtype: int32
                                                                      • qa_granule_pass_fail [📋]: 1 entries, dtype: int32
                                                                    • ds_geosegments [📋]: 5 entries, dtype: int8
                                                                    • ds_metrics [📋]: 18 entries, dtype: int8
                                                                    • ds_surf_type [📋]: 5 entries, dtype: int32
                                                                  " + ], + "text/plain": [ + "./data/ATL08_20230816182927_08792008_006_01.h5/ (47 attributes)\n", + "├METADATA\t(9 children) (3 attributes)\n", + "├ancillary_data\t(26 children) (2 attributes)\n", + "├ds_geosegments\t[int8: 5] (12 attributes)\n", + "├ds_metrics\t[int8: 18] (12 attributes)\n", + "├ds_surf_type\t[int32: 5] (12 attributes)\n", + "├gt1l\t(2 children) (7 attributes)\n", + "├gt1r\t(2 children) (7 attributes)\n", + "├gt2l\t(2 children) (7 attributes)\n", + "├gt2r\t(2 children) (7 attributes)\n", + "├gt3l\t(2 children) (7 attributes)\n", + "├gt3r\t(2 children) (7 attributes)\n", + "├orbit_info\t(9 children) (2 attributes)\n", + "└quality_assessment\t(2 children) (1 attributes)" + ] + }, + "execution_count": 20, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "H5Glance(atl08_file)" + ] + }, + { + "cell_type": "markdown", + "id": "1cac457a-515d-4024-8d16-7ab9e62e3237", + "metadata": {}, + "source": [ + "## Visualizing the Data\n", + "\n", + "By looking at the data variables, we can also create a visualization using `xarray`. 
Let's plot elevation:" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "a3decea5-672f-4c74-9e52-a8d11a3ed335", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "Dimensions: (delta_time: 18690, ds_geosegments: 5, ds_surf_type: 5)\n", + "Coordinates:\n", + " * delta_time (delta_time) datetime64[ns] 2023-08-16T18:29:24.853128...\n", + " latitude (delta_time) float32 ...\n", + " longitude (delta_time) float32 ...\n", + "Dimensions without coordinates: ds_geosegments, ds_surf_type\n", + "Data variables: (12/41)\n", + " asr (delta_time) float32 ...\n", + " atlas_pa (delta_time) float32 ...\n", + " beam_azimuth (delta_time) float32 ...\n", + " beam_coelev (delta_time) float32 ...\n", + " brightness_flag (delta_time) float32 ...\n", + " cloud_flag_atm (delta_time) float32 ...\n", + " ... ...\n", + " snr (delta_time) float32 ...\n", + " solar_azimuth (delta_time) float32 ...\n", + " solar_elevation (delta_time) float32 ...\n", + " surf_type (delta_time, ds_surf_type) int8 ...\n", + " terrain_flg (delta_time) float64 ...\n", + " urban_flag (delta_time) float64 ...\n", + "Attributes:\n", + " Description: Contains data categorized as land at 100 meter intervals.\n", + " data_rate: Data are stored as aggregates of 100 meters.\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
                                                                  " + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "with s3_fsspec.open(s3_url) as f:\n", + " atl08_track = xarray.open_dataset(f, group='gt1l/land_segments', engine=\"h5netcdf\", phony_dims='sort')\n", + " print(atl08_track)\n", + " atl08_track.dem_h.plot()" + ] + }, + { + "cell_type": "markdown", + "id": "dec4d2fc-7a93-419e-9996-4d8d20a8a892", + "metadata": { + "tags": [] + }, + "source": [ + "If we want to plot canopy height, we can also do that:" + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "id": "8003da8f-ded1-4f52-b6f3-cc9e110be1f5", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
                                                                  " + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "with s3_fsspec.open(s3_url) as f:\n", + " atl08_track = xarray.open_dataset(f, group='gt1l/land_segments/canopy', engine=\"h5netcdf\", phony_dims='sort')\n", + " atl08_track.h_canopy.plot()" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.13" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/docs/source/science/ESA_CCI/ESA_CCI_V4.ipynb b/docs/source/science/ESA_CCI/ESA_CCI_V4.ipynb index 27727306..df6b38a7 100644 --- a/docs/source/science/ESA_CCI/ESA_CCI_V4.ipynb +++ b/docs/source/science/ESA_CCI/ESA_CCI_V4.ipynb @@ -32,6 +32,8 @@ "This dataset comprises estimates of forest Above-Ground Biomass (AGB) for the years 2017, 2018, 2019 and 2020, version 4. They are derived from a combination of Earth Observation (EO) data, depending on the year, from the Copernicus Sentinel-1 mission, Envisat’s ASAR instrument and JAXA’s Advanced Land Observing Satellite (ALOS-1 and ALOS-2), along with additional information from Earth observation sources. 
The data has been produced as part of the European Space Agency's (ESA's) Climate Change Initiative (CCI) programme by the Biomass CCI team.\n", "\n", "### Additional Resources\n", + "* [Cloud Native Geoguide](https://guide.cloudnativegeo.org/)\n", + "* [Examples of Working with COGs](https://guide.cloudnativegeo.org/cloud-optimized-geotiffs/cogs-examples.html)\n", "* [ESA’s Climate Change Initiative Biomass project](https://climate.esa.int/en/odp/#/project/biomass)\n", "* [xarray Documentation](https://docs.xarray.dev/en/stable/index.html)\n", " " @@ -1582,7 +1584,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.10.8" + "version": "3.10.13" } }, "nbformat": 4, diff --git a/docs/source/science_examples.rst b/docs/source/science_examples.rst index 3729e8aa..f37edf83 100644 --- a/docs/source/science_examples.rst +++ b/docs/source/science_examples.rst @@ -11,8 +11,9 @@ Science Examples science/GEDI/GEDI_L2B.ipynb science/GEDI/GEDI_L3.ipynb science/GEDI/GEDI_L4A.ipynb - science/GEDI/GEDI_L4B.ipynb + science/GEDI/GEDI_L4B.ipynb science/ATL03/ATL03.ipynb + science/ATL08/ATL08.ipynb science/NISAR/NISAR_access.ipynb science/AfriSAR/AfriSAR_AGB.ipynb science/LVIS/accessing_LVIS_data.ipynb diff --git a/docs/source/system_reference_guide/ade_custom_extensions.rst b/docs/source/system_reference_guide/ade_custom_extensions.rst index caf09bb1..151349ae 100644 --- a/docs/source/system_reference_guide/ade_custom_extensions.rst +++ b/docs/source/system_reference_guide/ade_custom_extensions.rst @@ -1,4 +1,4 @@ -ADE Custom Extensions +Other Custom Extensions ======================================= .. 
toctree:: diff --git a/docs/source/system_reference_guide/ade_custom_extensions/maap_help.ipynb b/docs/source/system_reference_guide/ade_custom_extensions/maap_help.ipynb index e591685c..554a9ead 100644 --- a/docs/source/system_reference_guide/ade_custom_extensions/maap_help.ipynb +++ b/docs/source/system_reference_guide/ade_custom_extensions/maap_help.ipynb @@ -4,7 +4,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "# Maap Help Jupyter Extension\n", + "# MAAP Help Jupyter Extension\n", "This Jupyter extension provides an interactive tutorial on a new user's first launch of the ADE and adds MAAP specific information to the help tab. The interactive tutorial can be accessed again from the help menu. " ] }, diff --git a/docs/source/system_reference_guide/faq/import_granules.ipynb b/docs/source/system_reference_guide/faq/import_granules.ipynb index 8d6f6dea..b2ce78d0 100644 --- a/docs/source/system_reference_guide/faq/import_granules.ipynb +++ b/docs/source/system_reference_guide/faq/import_granules.ipynb @@ -7,17 +7,17 @@ "source": [ "# How Do I Import Granules Over From My EARTHDATA Search Into My Jupyter Notebook?\n", "\n", - "Launch EarthData Search by Data Search-> Open EarthData Search. After setting your search parameters or adding layers using the green plus, switch tabs back to your Jupyter notebook. At the top, open the Data Search menu, and select *Paste Search Results*.\n", + "Launch EarthData Search by selecting Data Search -> Open EarthData Search. After setting your search parameters or adding layers using the green plus, switch tabs back to your Jupyter notebook. At the top, open the Data Search menu, and select *Paste Granule Search Results*.\n", "\n", - " ![Import Granules](../../_static/faq_images/import_granules_1.png) \n", + " ![Import Granules](../../_static/faq_images/import_granules.png) \n", " \n", - "Caveat: This call uses the MAAP Python library. Make sure you import it before running the inserted code. 
You can do this by clicking on the blue “MAAP” text just below your notebook name (circled in red)." + "Caveat: The *Paste Granule Search Query* call uses the MAAP Python library. Make sure you import it before running the inserted code. You can do this by clicking on the blue “MAAP” button just below your notebook name (upper left corner)." ] } ], "metadata": { "kernelspec": { - "display_name": "Python 3.11.1 64-bit", + "display_name": "Python 3.12.2 64-bit", "language": "python", "name": "python3" }, @@ -31,11 +31,11 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.1" + "version": "3.12.2" }, "vscode": { "interpreter": { - "hash": "5c7b89af1651d0b8571dde13640ecdccf7d5a6204171d6ab33e7c296e100e08a" + "hash": "b0fa6594d8f4cbf19f97940f81e996739fb7646882a419484c72d19e05852a7e" } } }, diff --git a/docs/source/system_reference_guide/jobs_maappy.ipynb b/docs/source/system_reference_guide/jobs_maappy.ipynb index e9e70e66..7b8084ba 100644 --- a/docs/source/system_reference_guide/jobs_maappy.ipynb +++ b/docs/source/system_reference_guide/jobs_maappy.ipynb @@ -75,7 +75,20 @@ "\n", "```\n", "'86fbac52-24b0-4963-8b67-59d0fc09946aSucceeded'\n", - "```" + "```\n", + "\n", + "### Job Status\n", + "Job status may be different between the HySDS Figaro job-monitoring dashboard and the Jobs UI. 
Below is a mapping of status terms:\n", + "```\n", + "MAAP <- HySDS\n", + "Accepted <- job-queued\n", + "Running <- job-started\n", + "Succeeded <- job-completed\n", + "Failed <- job-offline or job-failed\n", + "job-revoked <- job-revoked (when a queued or running job is stopped before completion)\n", + "\n", + "HySDS state not valid/used in MAAP: job-deduped\n", + "```\n" ] }, { diff --git a/docs/source/system_reference_guide/jobsui.ipynb b/docs/source/system_reference_guide/jobsui.ipynb index a5316b58..ce5cbe47 100644 --- a/docs/source/system_reference_guide/jobsui.ipynb +++ b/docs/source/system_reference_guide/jobsui.ipynb @@ -19,7 +19,7 @@ "\n", "1. From your workspace click on the __View & Submit Jobs__ card on the Launcher tab.\n", "\n", - "![job_ui_access](../_static/jobs_ui_access.png)\n" + "![job_ui_access](../_static/jobs_ui/jobs_ui_access.png)\n" ] }, { @@ -33,7 +33,20 @@ "\n", "Users can sort jobs by queued, start, and end time in ascending/descending order. Users may use the search bar to filter the job list down to jobs containing the user-provided string in any of the fields shown. \n", "\n", - "![jobs_ui_overview](../_static/jobs_ui_overview.png)\n" + "![jobs_ui_overview](../_static/jobs_ui/jobs_ui_overview.png)\n", + "\n", + "### Job Status\n", + "Job status may be different between the HySDS Figaro job-monitoring dashboard and the Jobs UI. Below is a mapping of status terms:\n", + "```\n", + "MAAP <- HySDS\n", + "Accepted <- job-queued\n", + "Running <- job-started\n", + "Succeeded <- job-completed\n", + "Failed <- job-offline or job-failed\n", + "job-revoked <- job-revoked (when a queued or running job is stopped before completion)\n", + "\n", + "HySDS state not valid/used in MAAP: job-deduped\n", + "```\n" ] }, { @@ -73,19 +86,19 @@ ".. note::\n", "Experimental feature: The output data will be put into a folder named for your Algorithm and the Job Tag. You can use the same Job Tag on several jobs (e.g. 
in a batch) to group related output data in one place. In [maap.py submitJob](jobs_maappy.ipynb#Submit-a-Job) this is the `identifier` field when you use submitJob().\n", "\n", - "![jobs_ui_submit](../_static/jobs_ui_submit.png)\n", + "![jobs_ui_submit](../_static/jobs_ui/jobs_ui_submit.png)\n", "\n", "Algorithms may contain additional inputs that users may have to provide.\n", "\n", - "![jobs_ui_submit_detail](../_static/jobs_ui_submit_detail.png)\n", + "![jobs_ui_submit_detail](../_static/jobs_ui/jobs_ui_submit_detail.png)\n", "\n", "Once all inputs have been provided, the user may click __Submit Job__ to submit the job. If the job was submitted successfully, a toast will appear in the bottom right corner containing the unique job id. Please give the __Submit Job__ button a second to execute. \n", "\n", - "![jobs_ui_submit_toast](../_static/jobs_ui_submit_toast.png)\n", + "![jobs_ui_submit_toast](../_static/jobs_ui/jobs_ui_submit_toast.png)\n", "\n", "If the job failed to submit, a toast will appear indicating the job failed to submit.\n", "\n", - "![jobs_ui_failed_toast](../_static/jobs_ui_failed_toast.png)" + "![jobs_ui_failed_toast](../_static/jobs_ui/jobs_ui_failed_toast.png)" ] }, { @@ -97,7 +110,36 @@ "\n", "Users may fill out the job submission form and - instead of submitting the job - click the __Copy Jupyter Notebook Code__ button to copy the __maap-py__ job submission command to their clipboard to then paste it into a Jupyter notebook.\n", "\n", - "![jobs_ui_copy_code](../_static/jobs_ui_copy_code.png)" + "![jobs_ui_copy_code](../_static/jobs_ui/jobs_ui_copy_code.png)" + ] + }, + { + "cell_type": "markdown", + "id": "84cf6298", + "metadata": {}, + "source": [ + "## Cancel Jobs\n", + "\n", + "Users may cancel queued or running jobs. Queued jobs that are cancelled will be deleted and no longer listed in the __View Jobs__ table. Running jobs that are cancelled will be stopped, but still viewable in the __View Jobs__ table. 
These jobs will have the status __job-revoked__.\n", + "\n", + ".. note::\n", + "Jobs that are listed as queued in the UI, then cancelled, may remain in the View Jobs table after the cancel request was submitted. This is due to a delay within the DPS between job state change and report of job state change. In these cases, the cancelled job was not really queued but had already started.\n", + "\n", + "1. In the View Jobs table, hover over the job entry you want to cancel to display the action bar.\n", + "\n", + "2. Click the cancel job button.\n", + "\n", + "![jobs_ui_revoke_job](../_static/jobs_ui/revoke_job.png)\n", + "\n", + "Once the cancel request is submitted, a toast will appear in the bottom right of the workspace indicating whether or not the request was successful.\n", + "\n", + "Successful submission:\n", + "![jobs_ui_revoke_success](../_static/jobs_ui/revoke_successful.png)\n", + "\n", + "Unsuccessful submission:\n", + "![jobs_ui_revoke_failed](../_static/jobs_ui/revoke_failed.png)\n", + "\n", + " " ] } ], diff --git a/docs/source/technical_tutorials.rst b/docs/source/technical_tutorials.rst index 45fc6821..785fb9cd 100644 --- a/docs/source/technical_tutorials.rst +++ b/docs/source/technical_tutorials.rst @@ -5,6 +5,7 @@ Technical Tutorials :maxdepth: 2 + technical_tutorials/dps_tutorial/dps_tutorial_demo.ipynb technical_tutorials/searching.rst technical_tutorials/visualizing.rst technical_tutorials/accessing.rst diff --git a/docs/source/technical_tutorials/access/accessing_cod.ipynb b/docs/source/technical_tutorials/access/accessing_cod.ipynb index 323871b5..33b583ea 100644 --- a/docs/source/technical_tutorials/access/accessing_cod.ipynb +++ b/docs/source/technical_tutorials/access/accessing_cod.ipynb @@ -35,6 +35,8 @@ "source": [ "## Additional Resources\n", "\n", + "- [Cloud Native Geoguide](https://guide.cloudnativegeo.org/)\n", + "- [Examples of Working with COGs](https://guide.cloudnativegeo.org/cloud-optimized-geotiffs/cogs-examples.html)\n", "- 
[Using pystac-client](https://pystac-client.readthedocs.io/en/stable/api.html)\n" ] }, @@ -1156,9 +1158,9 @@ ], "metadata": { "kernelspec": { - "display_name": "gedi_subset", + "display_name": "Python 3 (ipykernel)", "language": "python", - "name": "gedi_subset" + "name": "python3" }, "language_info": { "codemirror_mode": { @@ -1170,7 +1172,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.3" + "version": "3.10.13" } }, "nbformat": 4, diff --git a/docs/source/technical_tutorials/access/edav_wcs_data.ipynb b/docs/source/technical_tutorials/access/edav_wcs_data.ipynb index 7dab1074..346ffe2c 100644 --- a/docs/source/technical_tutorials/access/edav_wcs_data.ipynb +++ b/docs/source/technical_tutorials/access/edav_wcs_data.ipynb @@ -28,6 +28,8 @@ "metadata": {}, "source": [ "## Additional Resources\n", + "- [Cloud Native Geoguide](https://guide.cloudnativegeo.org/)\n", + "- [Examples of Working with COGs](https://guide.cloudnativegeo.org/cloud-optimized-geotiffs/cogs-examples.html)\n", "- [Raster data handling with Python](https://geoscripting-wur.github.io/PythonRaster/)\n", "- [OWSLib Github](https://github.com/geopython/OWSLib)\n", "- [rioxarray Documentation](https://corteva.github.io/rioxarray)" @@ -440,7 +442,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.10.12" + "version": "3.10.13" } }, "nbformat": 4, diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/alg-reg-2.png b/docs/source/technical_tutorials/dps_tutorial/_static/alg-reg-2.png new file mode 100644 index 00000000..bcac0f75 Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/alg-reg-2.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/dps_tutorial_git_repo.png b/docs/source/technical_tutorials/dps_tutorial/_static/dps_tutorial_git_repo.png new file mode 100644 index 00000000..79f740fb Binary files /dev/null and 
b/docs/source/technical_tutorials/dps_tutorial/_static/dps_tutorial_git_repo.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_1.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_1.png new file mode 100644 index 00000000..ae50899d Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_1.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_2.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_2.png new file mode 100644 index 00000000..93728072 Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_2.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_3.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_3.png new file mode 100644 index 00000000..f1c92165 Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_3.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_4.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_4.png new file mode 100644 index 00000000..86efea76 Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_4.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_5.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_5.png new file mode 100644 index 00000000..d979b8ba Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_5.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_6.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_6.png new file mode 100644 index 00000000..62bc4059 Binary files /dev/null and 
b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_register_6.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_submit_1.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_submit_1.png new file mode 100644 index 00000000..fdb446e0 Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_submit_1.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_submit_2.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_submit_2.png new file mode 100644 index 00000000..a9516f6d Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_submit_2.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_view_1.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_view_1.png new file mode 100644 index 00000000..81335c4b Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_view_1.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_view_2.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_view_2.png new file mode 100644 index 00000000..09a24f6e Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_view_2.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_view_3.png b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_view_3.png new file mode 100644 index 00000000..be70ad88 Binary files /dev/null and b/docs/source/technical_tutorials/dps_tutorial/_static/tutorial_view_3.png differ diff --git a/docs/source/technical_tutorials/dps_tutorial/dps_tutorial_demo.ipynb b/docs/source/technical_tutorials/dps_tutorial/dps_tutorial_demo.ipynb new file mode 100644 index 00000000..1b72d081 --- /dev/null +++ b/docs/source/technical_tutorials/dps_tutorial/dps_tutorial_demo.ipynb @@ -0,0 +1,541 @@ +{ + "cells": [ 
+ { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Data Processing System (DPS) Tutorial A to Z" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Authors: Sujen Shah and Rob Tapella\n", + "\n", + "Review and Editing: Chuck Daniels and Rajat Shinde\n", + "\n", + "Date: April, 2024\n", + "\n", + "Description: This DPS tutorial is intended to demonstrate the steps needed to create, register, run, monitor and view outputs of algorithm jobs run at scale. It includes a template repository with various files needed to set up and run a job. " + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Importing and Installing Packages" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Additional package installation will be included inline, and environment-configuration to support a custom conda environment in DPS is a part of the tutorial below." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Before Starting\n", + "\n", + "- This tutorial assumes that you have at least run through the [Getting Started Guide](../../getting_started/getting_started.ipynb) and have set up your MAAP account.\n", + "- This tutorial is made for the Application Development Environment (ADE) \"Basic Stable\" workspace v3.1.4 or later (February 2024 or later).\n", + "- This also assumes that you are familiar with using [Github with MAAP](../../system_reference_guide/work_with_git.ipynb)." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## An Overview of How DPS Works" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The MAAP DPS (Data Processing System) lets you run an Algorithm at scale, in the cloud. It is different from running a Jupyter notebook in that it is non-interactive. Therefore, when migrating a notebook to the DPS it needs to be altered to take all of the input parameters at once as a command-line program. 
Even if you start with a command-line script, there are best practices to follow when preparing it for the DPS. Once that is done, the Algorithm can be Registered in a way that allows you to execute analysis jobs using a web-based form, where each field is defined during the Registration process.\n", + "\n", + "The DPS will then be able to take a set of inputs and process them at scale. You do not need to worry about scheduling or scaling your jobs. You can also run your DPS Algorithm using the maap.py Python library in a loop to execute a batch of jobs (e.g., 1000 input files and one job per input-file). The DPS will manage the compute resources to handle your request, and you can easily find all of your outputs as each individual job completes." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Overview of this Tutorial" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "- Run and Monitor an example Algorithm using the Jobs UI to help anticipate what we will accomplish\n", + "- Clone the demo Algorithm\n", + "- Edit and test your Algorithm code to make sure that it is working in its original form\n", + "- Prepare the Algorithm for DPS by setting up the runtime arguments and pre-run environment set-up\n", + "- Register the Algorithm with the Algorithm UI\n", + "- Run and Monitor the Algorithm using the Jobs UI\n", + "- View the outputs and errors from your run" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Run and Monitor an example Algorithm" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "If you are not familiar with running jobs in the DPS, please try running through the [Jobs UI guide](../../system_reference_guide/jobsui.ipynb) and the [Getting Started Guide](../../getting_started/running_at_scale.ipynb).\n", + "\n", + "This can be helpful because the process of Registering an Algorithm for DPS helps to build the user-interface to Run a Job. 
By familiarizing yourself with the process of running a Job, the Registration process may become more intuitive." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Clone the Demo Algorithm" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We will use an example Python-based algorithm for this tutorial. First we need to get the demo code into a Jupyter workspace.\n", + "\n", + "1. For this tutorial, please use a Basic Stable workspace (v3.1.4 or later). \n", + "2. Clone the Github repository at https://github.com/MAAP-Project/dps_tutorial . For the sake of this tutorial, we will assume that the clone is placed into a folder called algorithms in our home folder (i.e., ~/algorithms).\n", + "```\n", + "mkdir ~/algorithms\n", + "cd ~/algorithms\n", + "git clone https://github.com/MAAP-Project/dps_tutorial.git\n", + "```\n", + "\n", + "An algorithm needs to be in a public code-repository in order to register it with the DPS. For this tutorial we will use the `gdal_wrapper` algorithm folder inside the `dps_tutorial` repository code. Now that you have the demonstration code, take a look at the files that are there and then we will be ready to perform a few test-runs before Registering it.\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Anatomy of the `gdal_wrapper` algorithm folder in the `dps_tutorial` repo:\n", + "\n", + "- `README.md` to describe the algorithm in Github\n", + "- `build-env.sh`: a shell script that is executed before the algorithm is run; it is used to set up any custom programming libraries used in the algorithm (i.e., a custom conda environment)\n", + "- `environment.yml`: a configuration file used by conda to add any custom libraries; this is used by build-env.sh\n", + "- `gdal_wrapper.py`: a python script that contains the logic of the algorithm\n", + "- `run_gdal.sh`: a shell script that DPS will execute when a run is requested. 
It calls any relevant python files with the required inputs\n", + "\n", + "![DPS Tutorial Git repository overview](_static/dps_tutorial_git_repo.png)\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Edit and Test your Code" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Once you have an algorithm such as the `gdal_wrapper`, test it to make sure that it is running properly. If it runs properly in a Jupyter Terminal window, you are one step closer to registering and running your algorithm in the DPS.\n", + "\n", + "Typically a Jupyter Notebook is run interactively. A DPS algorithm will take all inputs up-front, do the processing, and produce output files. The `gdal_wrapper` script is already set up like a DPS algorithm. Some aspects to note:\n", + "\n", + "- **Python argparse**: Using a library like [argparse](https://docs.python.org/3/library/argparse.html) to accept input parameters helps to make the code more readable and easier to debug when working locally. It provides an easy way to write a user-friendly command-line interface. \n", + "\n", + "- **Logging**: It is a good practice to write out a log file during the execution of your code making it easier to debug. When running on the DPS, any logs written to the `output` directory or written to `stdout` or `stderr` will automatically be preserved. \n", + "\n", + "### Testing the Python script locally within the workspace\n", + "\n", + "Before registering your algorithm you can test it locally to catch common errors related to input parsing and storing output. To test your algorithm locally before registration follow the below steps:\n", + "\n", + "- Deactivate the current python virtual environment and activate the pre-installed conda environment (for the Basic Stable workspace, it is vanilla)\n", + "```\n", + "conda deactivate\n", + "conda activate vanilla\n", + "```\n", + "- Make sure that your runtime conda environment is set up. 
To do this, run `build-env.sh` in the `gdal_wrapper` folder.\n", + "```\n", + "cd ~/algorithms\n", + "cd dps_tutorial/gdal_wrapper\n", + "./build-env.sh\n", + "```\n", + "- Make a new temporary directory outside your current repository. This is where you will do a test-run of your algorithm with some inputs and outputs.\n", + "```\n", + "mkdir ~/algorithms/dps_test_run\n", + "cd ~/algorithms/dps_test_run\n", + "```\n", + "- Create a directory called `input` and place any input files required by your algorithm. Here you will need to download any input files up-front, and then run your script. Also make an `output` folder. When you have registered your algorithm and run it in DPS, the input file can be passed in as a runtime parameter and DPS will automatically download it as part of the run.\n", + "```\n", + "mkdir input\n", + "mkdir output\n", + "```\n", + "```\n", + "# ls -F\n", + "input/ output/\n", + "```\n", + "- You will need a test GeoTIF file as input. If you do not have one, go to the folder where you'd like to download the example file (assuming you're in the `dps_test_run` folder as above, `cd input`) and use the following aws command (NOTE: if this step fails, it is likely that you are either in a Basic Stable workspace version prior to v3.1.4, or you do not have the vanilla conda environment activated):\n", + "```\n", + "cd input\n", + "```\n", + "```\n", + "aws s3 cp s3://nasa-maap-data-store/file-staging/nasa-map/ESACCI_Biomass_L4_AGB_V4_100m_2020/S40E160_ESACCI-BIOMASS-L4-AGB-MERGED-100m-2020-fv4.0.tif .\n", + "```\n", + "- Once the input directory is set up, `cd ..` back to the `dps_test_run` directory and call your run script. This is the script you would like the DPS to run when your code is executing on the cloud. Note: This assumes you have already built the environment with required custom packages as mentioned in the build-env.sh of your algorithm. 
We did this above.\n", + "```\n", + "cd ~/algorithms/dps_test_run\n", + "```\n", + "```\n", + "python ../dps_tutorial/gdal_wrapper/gdal_wrapper.py --input_file input/S40E160_ESACCI-BIOMASS-L4-AGB-MERGED-100m-2020-fv4.0.tif --output_file output/TestFile-30.tif --outsize 30\n", + "```\n", + "- Successful output of the script should look like this:\n", + "```\n", + "Installed GDAL Version: 3.6.1\n", + "b'Input file size is 2400, 3600\\n0...10...20...30...40...50...60...70...80...90...100 - done.\\n'\n", + "```\n", + "\n", + "And if you look in your output folder, you will see your output file:\n", + "```\n", + "# ls output/\n", + "TestFile-30.tif\n", + "```\n", + "\n", + "- If all desired outputs are created, you are one step closer to successfully running your algorithm on the DPS. Your core application can be run at a command-line in a non-interactive mode.\n", + "- The next step is to prepare the Algorithm to be run in DPS.\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Prepare the Algorithm for DPS" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Once your scripts are working locally, make sure that they will also work in DPS.\n", + "\n", + "The `gdal_wrapper` files are already prepared for DPS. When running from DPS we will have the `run_gdal.sh` shell script do the execution, so we should test it first:\n", + "```\n", + "cd ~/algorithms/dps_test_run\n", + "```\n", + "```\n", + "../dps_tutorial/gdal_wrapper/run_gdal.sh output_from_shell.tif 25\n", + "```\n", + "\n", + "This should write a similar message to STDOUT that you saw when executing `gdal_wrapper.py` above. You should see an output file that is slightly smaller than the original test run because we chose a smaller value for the `outsize` parameter.\n", + "\n", + "The shell script is wrapping the Python script that we ran above. 
Note that there are different parameters—in the shell script we read all the input files from `input/` and write outputs into the `output/` folder. If you read the shell script you will see how this is happening.\n", + "```\n", + "# ../dps_tutorial/gdal_wrapper/run_gdal.sh output_from_shell.tif 25\n", + "Installed GDAL Version: 3.7.0\n", + "b'Input file size is 11250, 11250\\n0...10...20...30...40...50...60...70...80...90...100 - done.\\n'\n", + "\n", + "# ls -alF *\n", + "input:\n", + "total 7696\n", + "drwxr-xr-x 2 root root 6144 Feb 28 15:52 ./\n", + "drwxr-xr-x 4 root root 6144 Feb 28 15:52 ../\n", + "-rw-r--r-- 1 root root 7869236 Jun 7 2023 S40E160_ESACCI-BIOMASS-L4-AGB-MERGED-100m-2020-fv4.0.tif\n", + "\n", + "output:\n", + "total 20488\n", + "drwxr-xr-x 2 root root 6144 Feb 28 15:54 ./\n", + "drwxr-xr-x 4 root root 6144 Feb 28 15:52 ../\n", + "-rw-r--r-- 1 root root 22804732 Feb 28 15:53 TestFile-30.tif\n", + "-rw-r--r-- 1 root root 15834792 Feb 28 15:54 output_from_shell.tif\n", + "```\n", + "\n", + "Some important things to note:\n", + "\n", + "File: `build-env.sh`\n", + "\n", + "- this script is used for installing custom packages using pip or conda \n", + "- can take conda environment definition from `environment.yml`\n", + "- current practice is to update the default environment for the Container that you're using\n", + "\n", + "File: `run_gdal.sh`\n", + "\n", + "- `run_gdal.sh` is a bash script to call the `gdal_wrapper.py` algorithm: make sure for DPS you have inputs and outputs in the right places. 
If you look at `run_gdal.sh` you will see that it is reading all the files from the `input/` folder and writing to the `output/` folder.\n", + "- sets the correct python environment for your code to run\n", + "- the best way to execute your algorithm with a custom environment is to use `conda run`, as shown in this script (`conda run --live-stream --name dps_tutorial python ${basedir}/gdal_wrapper.py --input_file ${INPUT_FILENAME} --output_file output/${OUTPUT_FILENAME} --outsize ${REDUCTION_SIZE}`)\n", + "\n", + "Run your scripts as if DPS is executing them:\n", + "\n", + "- activate the default conda environment, in this case `conda activate vanilla`\n", + "- run `build-env.sh` to create or update your custom environment\n", + "- run `run_gdal.sh` to execute your algorithm using the custom environment\n", + "\n", + "Future topics:\n", + "\n", + "- What happens with input and output in DPS\n", + "- How does file management happen?\n", + "- Relative paths vs. absolute for input/output\n", + "- Mimic what’s happening on DPS (basedir)\n", + "- This wrapper `run_gdal.sh` script needs to manage the input files the way that your python script requires them (e.g. pass single file at a time vs. multiple files at once, etc.)\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Register the Algorithm with DPS using the Algorithm UI" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "0. When you are registering your own algorithm, make sure that all your changes are committed and pushed into Github. The registration process will pull the code from Github as part of registration. In this case, we will simply use the existing demonstration repo.\n", + "1. Open up [Launcher: Register Algorithm](../../getting_started/running_at_scale.ipynb#Register-an-Algorithm) (the same as the Register Algorithm option from the Command Palette)\n", + "2. 
Fill in the fields as described below.\n", + "\n", + "#### First you fill in the public code-repository information:\n", + "![Code repo information](_static/tutorial_register_1.png)\n", + "\n", + "- The Repository URL is the .git URL. In the demo repository, it is\n", + "```\n", + "https://github.com/MAAP-Project/dps_tutorial.git\n", + "```\n", + "- Repository Branch is used as a version when this algorithm is registered. For your test it is likely `main`\n", + "- The Run and Build Commands must be the full path of the scripts that will be used by the DPS to build and execute the algorithm. Typically these will be the `repository_name/script_name.sh`. In this case we have a run command:\n", + "```\n", + "dps_tutorial/gdal_wrapper/run_gdal.sh\n", + "```\n", + "and a build command:\n", + "```\n", + "dps_tutorial/gdal_wrapper/build-env.sh\n", + "```\n", + "\n", + "#### Then fill in the rest of the algorithm information:\n", + "![Algorithm information](_static/tutorial_register_2.png)\n", + "\n", + "- The Algorithm Name will be the unique identifier for the algorithm in the MAAP system. It can be whatever you want. \n", + "- Algorithm Description is additional free-form text to describe what this algorithm does.\n", + "- Disk Space is the minimum amount of space you expect—including all inputs, scratch, and outputs—it gives the DPS an approximation to help optimize the run.\n", + "- Resource Allocation is a dropdown-selection with some options for memory and CPU of the cloud compute you expect to need.\n", + "- The Container URL is a URL of the Stack (workspace image environment) you are using as a base for the algorithm. The user-interface will pre-fill this with the Container of your current workspace; if this is the correct base workspace for the Algorithm (i.e., you successfully ran the Algorithm in a Terminal without requiring a custom base-Container), then you can leave it as is. 
In this example we use: `mas.maap-project.org/root/maap-workspaces/base_images/vanilla:main`\n", + "See [the Getting Started guide](../../getting_started/running_at_scale.ipynb#Container-URLs) for more information on Containers.\n", + "\n", + "#### Finally you fill in the input section:\n", + "- There are File Inputs and Positional Inputs (command-line parameters to adjust how the algorithm runs). In our example we have a File Input called `input_file` and two Positional Inputs: an output file called `output_file` and a parameter called `outsize` describing how much file-size reduction we want to get. For each input you can add a Description, a Default Value, and mark whether it’s required or optional.\n", + "\n", + "![Algorithm-Inputs information](_static/tutorial_register_3.png)\n", + "\n", + "3. Press Register and there will be a popup dialog with a link to view progress of the registration (you should copy the link and paste it into a new page, or open it in a new browser tab). If you close this modal, you can look for your Algorithm build at https://repo.maap-project.org/root/register-job-hysds-v4/-/jobs/\n", + "![Register confirmation popup information](_static/tutorial_register_4.png)\n", + "\n", + "In order to continue, your Algorithm must be successfully registered. The link from the modal dialog will have a screen with a progress log in it. If it is successful and complete, the bottom of the log will look something like this:\n", + "![Registration process log complete](_static/tutorial_register_5.png)\n", + "\n", + "If the registration process failed, the log will look like the below screenshot. 
In this case you will need to either ask for help, or scroll back up through the log to see what went wrong.\n", + "![Registration process log failed](_static/tutorial_register_6.png)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Running and Monitoring the Algorithm with the Jobs UI" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Once your Algorithm has been fully registered, you can try running a Job.\n", + "\n", + "1. Open the Launcher and select the [Submit Jobs](../../getting_started/running_at_scale.ipynb#Run-the-Algorithm-as-a-Job-and-Monitor-it) icon\n", + "2. Run the job. \n", + "- Choose the Algorithm you just registered using the dropdown menu.\n", + "- The Job Tag can be empty or any list of short terms that you would like to associate with your job. This will help you sort and filter the job list later. It is a comma-separated list of tags.\n", + "- The Resource is likely to be the same as the one you chose when registering the Algorithm. For the tutorial it can be the smallest one (8 GB).\n", + "- The input file can be any GeoTIF file that is accessible by the system. For example, you can browse the [MAAP STAC](https://stac-browser.maap-project.org/collections/ESACCI_Biomass_L4_AGB_V4_100m?.language=en) and find a GeoTIF. For example\n", + "```\n", + "s3://nasa-maap-data-store/file-staging/nasa-map/ESACCI_Biomass_L4_AGB_V4_100m_2020/S40E160_ESACCI-BIOMASS-L4-AGB-MERGED-100m-2020-fv4.0.tif\n", + "```\n", + "- The output file can have any name. It should end with .tif because it will be a GeoTIF also.\n", + "- Outsize is a number from 1 to 100.\n", + "![Submit Job Page](_static/tutorial_submit_1.png)\n", + "\n", + "3. 
Submit the job and go back to the View tab\n", + "- When you submit you should see a notification in the bottom right, and a note just under the Submit button, saying that it was successful\n", + "![Submit Success Notification](_static/tutorial_submit_2.png)\n", + "- at that point, open the Launcher -> View Jobs icon\n", + "\n", + "4. You can observe the progress of your job while it runs, and the status (complete or fail) when it completes using the View Jobs tab\n", + "![View Jobs Page](_static/tutorial_view_1.png)\n", + "- By selecting a row from the table (top panel) it will show Job Details (in the bottom panel)\n", + "- The status should go from queued to running, to completed or failed\n", + "- Check the Inputs and Outputs sections of the Job Details\n", + "\n", + "5. From the Outputs section, you can copy the path of your output file starting with `dps_outputs` and find it by going to your `~/my-private-bucket` folder and then following the remainder of the path. \n", + "![Copy the Path information](_static/tutorial_view_2.png)\n", + "\n", + "In that folder you will see some JSON files with metadata about the job and the data, as well as the output file (your .tif file).\n", + "![cd to path using Terminal](_static/tutorial_view_3.png)\n", + "\n", + "You can download the output files by browsing to them in the Jupyter file panel and selecting Download from the contextual menu (right-click)." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Running and Monitoring using the HySDS Jobs UI (Figaro)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "This will be described in a future update. HySDS is the data-processing system used to run the jobs. It has a full web application that is used by NASA missions to monitor jobs and data-outputs. If you would like to beta-test this UI with MAAP, please contact Sujen or George." 
+ ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Registering and Running the Algorithm using maap.py" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "This will be described in a future update. Often larger batch-jobs are run from Python Notebooks rather than the GUI." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Getting the Outputs of the Job" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Output folder\n", + "\n", + "The DPS treats a folder named `output` specially. Any files stored in this folder will be preserved and uploaded to S3 after the algorithm run is complete. The location of this output will depend on factors like algorithm name, time of run, tags, etc. This output folder can be viewed within your workspace under the `my-private-bucket/dps_output` directory.\n", + "\n", + "The output directory is created relative to your script specified in `run_command` at the time of registration. So to access the directory, simply do something like this in your run script. \n", + "```\n", + "mkdir -p output\n", + "``` \n", + " \n", + "#### Stderr & Stdout \n", + "\n", + "By default, anything written to the stderr and stdout pipes will be stored in files called `_stderr` and `_stdout` and placed in your output directory. \n", + "\n", + "#### Logfiles\n", + "\n", + "DPS does not automatically store any logfiles written by your algorithm; if you would like them to be preserved, make sure to write them to the output directory. " + ] + }, + { + "cell_type": "markdown", + "metadata": { + "collapsed": false + }, + "source": [ + "## Frequently Asked Questions (FAQ)" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "collapsed": false + }, + "source": [ + "### What happens with input and output in DPS?\n", + "\n", + "Since the jobs on DPS are run on a machine on the cloud, your local workspace directories are not available. 
It is important to pass any files required as inputs for your algorithm using the `File` parameter type. \n", + "Any outputs that need to be saved should be placed in a directory called `output`. \n", + "\n", + "When a parameter is registered as a file input, DPS downloads the corresponding value provided by the user as a file and places it in a directory called `input`. \n", + "It is important to note that if the value provided for a parameter marked as a file during registration is not a valid URL, DPS will report an error.\n", + "\n", + "Note: Both `input` and `output` directories are relative to your run script. \n", + " \n", + "### How does file management happen?\n", + "\n", + "File management (i.e., files required for input and files stored as outputs on S3) is taken care of by the DPS. To locate the files created as an output from your job, look into the `/projects/my-private-bucket/dps_output` directory in your workspace and navigate to the algorithm type and time of run. \n", + "\n", + "You can also construct the output path of your files by looking at the job info on the Jobs UI or by running \n", + "```maap.getJobResult('job_id')```\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "collapsed": false + }, + "source": [ + "### What is the basedir variable in the run script example?\n", + "\n", + "Because your job on the DPS runs on a cloud machine, it is not possible to know the absolute path of your script before execution. \n", + "Using \n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": false, + "is_executing": true + }, + "outputs": [], + "source": [ + "#basedir=$(dirname \"$(readlink -f \"$0\")\")" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "collapsed": false + }, + "source": [ + "allows you to get the absolute path of the directory in which your run script is present, allowing you to set any other executable paths as required by your algorithm. 
\n", + "\n" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "gedi_subset", + "language": "python", + "name": "gedi_subset" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.3" + } + }, + "nbformat": 4, + "nbformat_minor": 4 +} diff --git a/docs/source/technical_tutorials/user_data.rst b/docs/source/technical_tutorials/user_data.rst index d235a4c5..a76b102b 100644 --- a/docs/source/technical_tutorials/user_data.rst +++ b/docs/source/technical_tutorials/user_data.rst @@ -5,4 +5,5 @@ User Data :maxdepth: 2 :caption: User Data: - user_data/create-datasets-for-dashboard.ipynb \ No newline at end of file + user_data/create-datasets-for-dashboard.ipynb + user_data/memory-profiling-python.ipynb \ No newline at end of file diff --git a/docs/source/technical_tutorials/user_data/create-datasets-for-dashboard.ipynb b/docs/source/technical_tutorials/user_data/create-datasets-for-dashboard.ipynb index 08d54bc0..43ed897f 100644 --- a/docs/source/technical_tutorials/user_data/create-datasets-for-dashboard.ipynb +++ b/docs/source/technical_tutorials/user_data/create-datasets-for-dashboard.ipynb @@ -48,6 +48,8 @@ "metadata": {}, "source": [ "## Additional Resources\n", + "- [Cloud Native Geoguide](https://guide.cloudnativegeo.org/)\n", + "- [Examples of Working with COGs](https://guide.cloudnativegeo.org/cloud-optimized-geotiffs/cogs-examples.html)\n", "- [Rio Tiler Colors](https://cogeotiff.github.io/rio-tiler/colormap/)\n", "- [Matplotlib Colors](https://matplotlib.org/stable/tutorials/colors/colormaps.html) " ] @@ -1195,7 +1197,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.10.8" + "version": "3.10.13" } }, "nbformat": 4, diff --git a/docs/source/technical_tutorials/user_data/demo_memory_profiling.py 
b/docs/source/technical_tutorials/user_data/demo_memory_profiling.py new file mode 100644 index 00000000..33f1e5cf --- /dev/null +++ b/docs/source/technical_tutorials/user_data/demo_memory_profiling.py @@ -0,0 +1,24 @@ +from memory_profiler import profile + +@profile +def my_function(): + # Include each line of the script which needs to be profiled + # under this function + + return 0 + +@profile +def my_other_function(): + # Include each line of the script which needs to be profiled + # under this function + + return 0 + +def main(): + my_function() + my_other_function() + + #... + +if __name__ == "__main__": + main() \ No newline at end of file diff --git a/docs/source/technical_tutorials/user_data/demo_memory_profiling_logging.py b/docs/source/technical_tutorials/user_data/demo_memory_profiling_logging.py new file mode 100644 index 00000000..7ed1ae8e --- /dev/null +++ b/docs/source/technical_tutorials/user_data/demo_memory_profiling_logging.py @@ -0,0 +1,27 @@ +from memory_profiler import profile + +fp=open('memory_profiler.log','w+') +@profile(stream=fp) +def my_function(): + # Include each line of the script which needs to be profiled + # under this function + + return 0 + +@profile(stream=fp) +def my_other_function(): + # Include each line of the script which needs to be profiled + # under this function + + return 0 + +def main(): + my_function() + my_other_function() + + #... 
+ +if __name__ == "__main__": + main() + + \ No newline at end of file diff --git a/docs/source/technical_tutorials/user_data/memory-profiling-python.ipynb b/docs/source/technical_tutorials/user_data/memory-profiling-python.ipynb new file mode 100644 index 00000000..6347f8a2 --- /dev/null +++ b/docs/source/technical_tutorials/user_data/memory-profiling-python.ipynb @@ -0,0 +1,278 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "8f399a66-d82e-4210-a08e-4501903b6e2b", + "metadata": { + "tags": [] + }, + "source": [ + "# Memory Profiling Python Scripts in the MAAP ADE\n", + "\n", + "Authors: Rajat Shinde (UAH), Alex Mandel (DevSeed), Jamison French (DevSeed), Sheyenne Kirkland (UAH), Brian Freitag (NASA MSFC), Chuck Daniels (DevSeed)\n", + "\n", + "Date: February 7, 2024\n", + "\n", + "Description: Memory profiling your Python script is a good practice to understand the resource requirements. This is useful when you have working code and you want to estimate the size of the DPS worker to be used. Additionally, it is helpful to optimize the code for resource requirements. \n", + "\n", + "In this tutorial, we will use [memory-profiler](https://pypi.org/project/memory-profiler/) for profiling a sample Python script [demo_memory_profiling.py](./demo_memory_profiling.py). We also see how to log the output to a `.log` file. \n", + "\n", + "### Run This Notebook\n", + "To access and run this tutorial within MAAP's Algorithm Development Environment (ADE), please refer to the [\"Getting started with the MAAP\"](https://docs.maap-project.org/en/latest/getting_started/getting_started.html) section of our documentation.\n", + "\n", + "Disclaimer: It is highly recommended to run a tutorial within MAAP's ADE, which already includes packages specific to MAAP, such as maap-py. Running the tutorial outside of the MAAP ADE may lead to errors.\n", + "\n", + "### Additional Resources\n", + "\n", + "1. 
[https://github.com/pythonprofilers/memory_profiler](https://github.com/pythonprofilers/memory_profiler)" + ] + }, + { + "cell_type": "markdown", + "id": "24efa20c-66e9-45d2-bc6d-695b38329158", + "metadata": {}, + "source": [ + "### Installation \n", + "\n", + "We will begin by installing `memory-profiler` in the current working environment." + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "c54089e1-d6ec-4386-95da-06fdd3c357cb", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Collecting memory-profiler\n", + " Using cached memory_profiler-0.61.0-py3-none-any.whl (31 kB)\n", + "Requirement already satisfied: psutil in /opt/conda/envs/vanilla/lib/python3.10/site-packages (from memory-profiler) (5.9.7)\n", + "Installing collected packages: memory-profiler\n", + "Successfully installed memory-profiler-0.61.0\n", + "\u001b[33mWARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\u001b[0m\u001b[33m\n", + "\u001b[0m" + ] + } + ], + "source": [ + "# !pip install -U memory-profiler" + ] + }, + { + "cell_type": "markdown", + "id": "5a3baaf1-8d1b-4e61-9798-f205fc2648fd", + "metadata": {}, + "source": [ + "### Add Decorator \n", + "\n", + "Typically, line-by-line memory usage is required for analyzing code. For this example, we are creating dummy functions to be profiled, named `my_function` and `my_other_function`. \n", + "\n", + "You may add the `@profile` decorator to individual functions that you want to profile. This allows you to limit which parts of your program are profiled, thus limiting the volume of profiling output.\n", + "\n", + "However, this requires you to modify your code. 
If you wish to avoid modifying your code, particularly when it is not yet obvious which parts of your code may be consuming too much memory, simply add the `-m memory_profiler` to the python command." + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "f4c9941c-e8b8-4c3c-b545-a173284248d8", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "ERROR: Could not find file /tmp/ipykernel_314/3429381877.py\n", + "ERROR: Could not find file /tmp/ipykernel_314/3429381877.py\n" + ] + } + ], + "source": [ + "from memory_profiler import profile\n", + "\n", + "@profile\n", + "def my_function():\n", + " # Perform some potentially memory-intensive computation\n", + " \n", + " return 0\n", + "\n", + "@profile\n", + "def my_other_function():\n", + " # Perform some potentially memory-intensive computation\n", + " \n", + " return 0\n", + "\n", + "def main():\n", + " my_function()\n", + " my_other_function()\n", + " \n", + " #...\n", + "\n", + "if __name__ == \"__main__\":\n", + " main()" + ] + }, + { + "cell_type": "markdown", + "id": "de6a276c-78a9-4769-9fa8-f387deaac9de", + "metadata": {}, + "source": [ + "### Running Memory Profiler \n", + "\n", + "For understanding how to run memory profiler on an existing Python script from a Jupyter notebook, we copied the code snippet from above to a file named `demo_memory_profiling.py` in the working directory. After executing the Python script, we can see the details about memory usage and increment due to a particular line in the output." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "dababd0c-74e8-4b26-ae15-f25ccbac3c0e", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Filename: /projects/maap-documentation/docs/source/technical_tutorials/user_data/demo_memory_profiling.py\n", + "\n", + "Line # Mem usage Increment Occurrences Line Contents\n", + "=============================================================\n", + " 6 43.6 MiB 43.6 MiB 1 @profile\n", + " 7 def my_function():\n", + " 8 # Include each line of the script which needs to be profiled\n", + " 9 # under this function\n", + " 10 \n", + " 11 43.6 MiB 0.0 MiB 1 return 0\n", + "\n", + "\n", + "Filename: /projects/maap-documentation/docs/source/technical_tutorials/user_data/demo_memory_profiling.py\n", + "\n", + "Line # Mem usage Increment Occurrences Line Contents\n", + "=============================================================\n", + " 13 43.6 MiB 43.6 MiB 1 @profile\n", + " 14 def my_other_function():\n", + " 15 # Include each line of the script which needs to be profiled\n", + " 16 # under this function\n", + " 17 \n", + " 18 43.6 MiB 0.0 MiB 1 return 0\n", + "\n", + "\n" + ] + } + ], + "source": [ + "# With @profile decorator in the script\n", + "\n", + "!python demo_memory_profiling.py" + ] + }, + { + "cell_type": "markdown", + "id": "8122d39c-d7d8-4db4-9b08-b89280ee24ce", + "metadata": {}, + "source": [ + "### Logging the Output\n", + "\n", + "By default, the output can be seen in the cell output or on the command line as standard output. This can be changed to store the output in a log file. For more details, it is recommended to follow the [documentation](https://github.com/pythonprofilers/memory_profiler?tab=readme-ov-file#reporting)." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "24518fe3-973e-4c23-ba46-afb04da2815e", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "ERROR: Could not find file /tmp/ipykernel_314/1328302985.py\n", + "ERROR: Could not find file /tmp/ipykernel_314/1328302985.py\n" + ] + } + ], + "source": [ + "fp=open('memory_profiler.log','w+')\n", + "@profile(stream=fp)\n", + "def my_function():\n", + " # Perform some potentially memory-intensive computation\n", + " \n", + " return 0\n", + "\n", + "@profile(stream=fp)\n", + "def my_other_function():\n", + " # Perform some potentially memory-intensive computation\n", + " \n", + " return 0\n", + "\n", + "def main():\n", + " my_function()\n", + " my_other_function()\n", + " \n", + " #...\n", + "\n", + "if __name__ == \"__main__\":\n", + " main()" + ] + }, + { + "cell_type": "markdown", + "id": "56291280-e0ad-409b-bce2-0c96c07664e7", + "metadata": {}, + "source": [ + "To test the logging, we will run memory profiling on the `demo_memory_profiling_logging.py` script saved in the working directory." + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "98bbc844-b02a-4269-ad13-f8361157be52", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "!python demo_memory_profiling_logging.py" + ] + }, + { + "cell_type": "markdown", + "id": "c8a2b85d-9da8-4246-927b-00cf4e20f296", + "metadata": {}, + "source": [ + "After executing the above script, we can see that the memory profiling output is saved in the `memory_profiler.log` file. You can also log profiling output to different log files for different functions by passing a separate open file object to the `stream` argument of each `@profile` decorator. 
" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "vanilla", + "language": "python", + "name": "vanilla" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.13" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/docs/source/technical_tutorials/visualization/interval_color_mapping.ipynb b/docs/source/technical_tutorials/visualization/interval_color_mapping.ipynb index dc7ace14..907a8c0b 100644 --- a/docs/source/technical_tutorials/visualization/interval_color_mapping.ipynb +++ b/docs/source/technical_tutorials/visualization/interval_color_mapping.ipynb @@ -37,6 +37,8 @@ "metadata": {}, "source": [ "## Additional Resources \n", + "- [Cloud Native Geoguide](https://guide.cloudnativegeo.org/)\n", + "- [Examples of Working with COGs](https://guide.cloudnativegeo.org/cloud-optimized-geotiffs/cogs-examples.html)\n", "- [Predefined Color Maps](https://matplotlib.org/3.1.0/tutorials/colors/colormaps.html)\n", "- [CSS RGBA Colors](https://www.w3schools.com/css/css3_colors.asp)\n", "- [Using Python Zip Function](https://www.w3schools.com/python/ref_func_zip.asp)\n" @@ -465,7 +467,7 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3.11.2 64-bit", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -479,7 +481,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.2" + "version": "3.10.13" }, "vscode": { "interpreter": {