
Commit 3d889e7

e-marshall and scottyhq authored

Writing edits (#38)

* bunch of edits
* add captions
* add file numbers back in
* fix file names and a few links
* add why os section in intro
* Add instructions for executing tutorial notebooks on CryoCloud JupyterHub (#41)
  * jupyterhub instructions
  * wording change
  Co-authored-by: e-marshall <[email protected]>
* fix file names and a few links (fixing files that were renamed)
* spelling and formatting fixes
* remove files from tracking
* add mkdirs line in s1 nb1 and some formatting changes
* few typo fixes and other things + os section in intro
* updates to datacube revisit and others
* edits from jessica
* clean nbs
* nit
* update gitignore to remove vector data cube
* undo gitignore change, will do in sep pr
* switch build branch back to main
* add note about download time

Co-authored-by: Scott Henderson <[email protected]>
1 parent 86cd6eb commit 3d889e7

51 files changed (+976, −4679 lines)

.codespellignore (+10)

@@ -0,0 +1,10 @@
+"Xarray",
+"geospatial",
+"CEOS",
+"backscatter",
+"Dask",
+"Zarr",
+"geoscience",
+"STAC", "stackstac", "PySTAC", "Zenodo", "USGS","SERVIR","NSIDC","shapefile","pixi","itslive",
+"jovyan","kernelspec","regridding","Pangeo","Xvec"
+"basemaps","matplotlib","fontsize","skipna","linestyle","GDAL"

.gitignore (+10, −1)

@@ -2,8 +2,17 @@
 _build
 _static

+#scratch
+all_links.txt
+node_modules/
+package-lock.json
+package.json
+utils/get_links.py
+
 #Data
-**/data/raster_data/*
+sentinel1/data/raster_data/*
+itslive/data/raster_data/*
+#itslive/data/raster_data/single_glacier_itslive.zarr/*

 #Extra nbs
 sentinel1/subste_nbs

.pre-commit-config.yaml (+9, −1)

@@ -12,7 +12,7 @@ repos:
     rev: 1.9.1 # Check latest version
     hooks:
       - id: nbqa-flake8
-        args: ["--max-line-length=120"]
+        args: ["--max-line-length=88","--ignore=E402"] #ignore module import not at top of file
         files: "\\.ipynb$"
       - id: nbqa-black
         args: ["--line-length=120"]
@@ -41,3 +41,11 @@ repos:
     hooks:
       - id: markdown-link-check
        args: [-q]
+
+  - repo: https://github.com/codespell-project/codespell
+    rev: v2.4.1
+    hooks:
+      - id: codespell
+        #files: ^.*\.(py|md|ipynb)$
+        args: ["--ignore-words", ".codespellignore", "--skip=*.bib", "--skip=*.lock","--skip=run_itslive_nbs.py"]
+

book/_config.yml (+5, −3)

@@ -53,6 +53,8 @@ parse:
     - substitution
 sphinx:
   config:
+    # application/vnd.holoviews_load.v0+json, application/vnd.holoviews_exec.v0+json
+    suppress_warnings: ["mystnb.unknown_mime_type"]
     bibtex_reference_style: label
     myst_heading_anchors: 3
     myst_enable_extensions:
@@ -68,12 +70,12 @@ sphinx:
       - substitution

     myst_substitutions:
-      part1_title: "Background"
+      part1_title: "Part 2: Background"
       part2_title: "ITS_LIVE ice velocity data tutorial"
       #part2_title: "Using Xarray to examine cloud-based glacier surface velocity data"
       part3_title: "Sentinel-1 RTC imagery tutorial"
       #part3_title: "Sentinel-1 RTC data workflows with xarray"
-      part4_title: "Summary + Conclusion"
+      part4_title: "Part 5: Conclusion"

       #tutorial 1 nb titles
       title_its_nb1: "# 3.1 Accessing cloud-hosted ITS_LIVE data"
@@ -122,7 +124,7 @@ sphinx:
       a_its_nb2: "A. Compare approaches for reading larger than memory data"
       a1_its_nb2: "1) `chunks = 'auto'`"
       a2_its_nb2: "2) `chunks = {}`"
-      a3_its_nb2: "3) An out-of-order time dimensions"
+      a3_its_nb2: "3) An out-of-order time dimension"
       a4_its_nb2: "4) Read the dataset without Dask"
       b_its_nb2: "B. Organize data once it's in memory"
       b1_its_nb2: "1) Arrange dataset in chronological order"

book/_toc.yml (+21, −19)

@@ -4,33 +4,35 @@ root: introduction
 parts:
   - caption: Part 1. Introduction
     chapters:
-      - file: intro/getting_started
-      - file: intro/learning_objectives
-      - file: intro/open_source_setting
+      - file: intro/1_getting_started
+      - file: intro/2_learning_objectives
+      - file: intro/3_open_source_setting
   - caption: Part 2. Background
     chapters:
-      - file: background/context_motivation
-      - file: background/data_cubes
-      - file: background/tutorials_overview
-      - file: background/tutorial_data
-      - file: background/software
-      - file: background/relevant_concepts
+      - file: background/background.md
+      - file: background/1_context_motivation
+      #- file: background/ard_data_tidying
+      - file: background/2_data_cubes
+      - file: background/3_tutorials_overview
+      - file: background/4_tutorial_data
+      - file: background/5_software
+      - file: background/6_relevant_concepts
   - caption: Part 3. ITS_LIVE Tutorial
     chapters:
       - file: itslive/itslive_intro
-      - file: itslive/nbs/accessing_itslive_s3_data
-      - file: itslive/nbs/larger_than_memory_data
-      - file: itslive/nbs/combining_raster_vector_data
-      - file: itslive/nbs/exploratory_data_analysis_single
-      - file: itslive/nbs/exploratory_data_analysis_group
+      - file: itslive/nbs/1_accessing_itslive_s3_data
+      - file: itslive/nbs/2_larger_than_memory_data
+      - file: itslive/nbs/3_combining_raster_vector_data
+      - file: itslive/nbs/4_exploratory_data_analysis_single
+      - file: itslive/nbs/5_exploratory_data_analysis_group
   - caption: Part 4. Sentinel-1 RTC Tutorial
     chapters:
       - file: sentinel1/s1_intro
-      - file: sentinel1/nbs/read_asf_data
-      - file: sentinel1/nbs/wrangle_metadata
-      - file: sentinel1/nbs/asf_exploratory_analysis
-      - file: sentinel1/nbs/read_pc_data
-      - file: sentinel1/nbs/comparing_s1_rtc_datasets
+      - file: sentinel1/nbs/1_read_asf_data
+      - file: sentinel1/nbs/2_wrangle_metadata
+      - file: sentinel1/nbs/3_asf_exploratory_analysis
+      - file: sentinel1/nbs/4_read_pc_data
+      - file: sentinel1/nbs/5_comparing_s1_rtc_datasets
   - caption: Part 5. Conclusion
     chapters:
       - file: conclusion/wrapping_up
@@ -1,28 +1,33 @@
 # 2.1 Context & Motivation

-This book demonstrates scientific workflows using publicly-available, cloud-optimized geospatial datasets and open-source scientific software tools in order to address the need for educational resources related to new technologies and reduce barriers to entry to working with earth observation data. The tutorials in this book focus on the complexities inherent to working with n-dimensional, gridded datasets and use the core stack of software packages built on and around the Xarray data model.
+This book demonstrates scientific workflows using publicly available, cloud-optimized geospatial datasets and open-source scientific software tools in order to address the need for educational resources related to new technologies and reduce barriers to entry to working with earth observation data. The tutorials in this book focus on the complexities inherent to working with n-dimensional, gridded datasets and use the core stack of software packages built on and around the Xarray data model.

-### *Moving away from the 'download model' of scientific data analysis*
+## *Moving away from the 'download model' of scientific data analysis*

-Technological developments in recent decades have engendered fundamental shifts in the nature of scientific data and how it is used for analysis.
+Technological developments in recent decades have engendered fundamental shifts in the nature of scientific data and how it is used for analysis ({cite:t}`abernathey_2021_cloud,gentemann_2021_science,stern_2022_PangeoForge`).

 ```{epigraph}
 "Traditionally, scientific data have been distributed via a “download model,” wherein scientists download individual data files to local computers for analysis. After downloading many files, scientists typically have to do extensive processing and organizing to make them useful for the data analysis; this creates a barrier to reproducibility, since a scientist’s analysis code must account for this unique “local” organization. Furthermore, the sheer size of the datasets (many terabytes to petabytes) can make downloading effectively impossible. Analysis of such data volumes also can benefit from parallel / distributed computing, which is not always readily available on local computers. Finally, this model reinforces inequality between privileged institutions that have the resources to host local copies of the data and those that don’t. This restricts who can participate in science."
-    -- {cite}`abernathey_2021_cloud`
+    -- {cite:t}`abernathey_2021_cloud`
 ```

-### *Increasingly large, cloud-optimized data means new tools and approaches for data management*
+## *Increasingly large, cloud-optimized data means new tools and approaches for data management*

-The increase in publicly available earth observation data has transformed scientific workflows across a range of fields, prompting analysts to gain new skills in order to work with larger volumes of data in new formats and locations, and to use distributed cloud-computational resources in their analysis ({cite:t}`abernathey_2021_cloud,gentemann_2021_science,mathieu_2017_esas,ramachandran_2021_open,Sudmanns_2020_big,wagemann_2021_user`).
+The increase in publicly available earth observation data has transformed scientific workflows across a range of fields, prompting analysts to gain new skills in order to work with larger volumes of data in new formats and locations, and to use distributed cloud-computational resources in their analysis ({cite:t}`abernathey_2021_cloud,Boulton02012018,gentemann_2021_science,mathieu_2017_esas,ramachandran_2021_open,Sudmanns_2020_big,wagemann_2021_user`).

 ```{figure} imgs/fy24-projection-chart.png
 ---
 ---
 Volume of NASA Earth Science Data archives, including growth of existing-mission archives and new missions, projected through 2029. Source: [NASA EarthData - Open Science](https://www.earthdata.nasa.gov/about/open-science).
 ```

-### *Asking questions of complex datasets*
+## *Asking questions of complex datasets*

-Scientific workflows involve asking complex questions of diverse types of data. Earth observation and related datasets often contain two types of information: measurements of a physical observable (e.g. temperature) and metadata that provides auxiliary information that required in order to interpret the physical observable (time and location of measurement, information about the sensor, etc.). With the increasingly complex and large volume of earth observation data that is currently available, storing, managing and organizing these types of data can very quickly become a complex and challenging task, especially for students and early-career analysts {cite}`mathieu_esas_2017,palumbo_2017_building,Sudmanns_2020_big,wagemann_2021_user`.
+Scientific workflows involve asking complex questions of diverse types of data. Earth observation and related datasets often contain two types of information: measurements of a physical observable (e.g. temperature) and metadata that provides auxiliary information that required in order to interpret the physical observable (time and location of measurement, information about the sensor, etc.). With the increasingly complex and large volume of earth observation data that is currently available, storing, managing and organizing this information can very quickly become a complex and challenging task, especially for students and early-career analysts ({cite:t}`mathieu_2017_esas,palumbo_2017_building,Sudmanns_2020_big,wagemann_2021_user,stern_2022_PangeoForge`).

-This book provides detailed examples of scientific workflow steps that ingest complex, multi-dimensional datastets, introduce users to the landscape of popular, actively-maintained open-source software packages for working with geospatial data in Python, and include strategies for working with larger-than memory data stored in publicly available, cloud-hosted repositories. These demonstrations are accompanied by detailed discussion of concepts involved in analyzing earth observation data such as dataset inspection, manipulation, and exploratory analysis and visualization. Overall, we emphasize the importance of understanding the structure of multi-dimensional earth observation datasets within the context of a given data model and demonstrate how such an understanding can enable more efficient and intuitive scientific workflows.
+This book provides detailed examples of scientific workflow steps that ingest complex, multi-dimensional datasets, introduce users to the landscape of popular, actively-maintained open-source software packages for working with geospatial data in Python, and include strategies for working with larger-than memory data stored in publicly available, cloud-hosted repositories. These demonstrations are accompanied by detailed discussion of concepts involved in analyzing earth observation data such as dataset inspection, manipulation, and exploratory analysis and visualization. Overall, we emphasize the importance of understanding the structure of multi-dimensional earth observation datasets within the context of a given data model and demonstrate how such an understanding can enable more efficient and intuitive scientific workflows.
+
+
+
+
+
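The edited text above emphasizes that earth observation datasets pair measurements with the metadata needed to interpret them, and that a data model like Xarray's keeps the two together. The following is a minimal, stdlib-only sketch of that idea; the `LabeledCube` class and all names in it are hypothetical illustrations, not Xarray's actual API.

```python
# Sketch of a labeled n-dimensional data model: measured values are stored
# together with dimension names, coordinate labels, and attributes.
# This is an illustration of the concept only, not Xarray itself.
from dataclasses import dataclass, field


@dataclass
class LabeledCube:
    values: list  # nested lists: values[time][y][x]
    dims: tuple  # e.g. ("time", "y", "x")
    coords: dict  # dimension name -> list of coordinate labels
    attrs: dict = field(default_factory=dict)

    def sel(self, **labels):
        """Select along the leading dimension by coordinate label."""
        dim, label = next(iter(labels.items()))
        assert dim == self.dims[0], "sketch only supports the leading dimension"
        i = self.coords[dim].index(label)
        return LabeledCube(
            self.values[i],
            self.dims[1:],
            {d: self.coords[d] for d in self.dims[1:]},
            self.attrs,
        )


# Hypothetical 2x2x3 "temperature" cube with two acquisition dates.
cube = LabeledCube(
    values=[[[1, 2, 3], [4, 5, 6]], [[7, 8, 9], [10, 11, 12]]],
    dims=("time", "y", "x"),
    coords={
        "time": ["2021-01-01", "2021-01-13"],
        "y": [10.0, 20.0],
        "x": [0.0, 1.0, 2.0],
    },
    attrs={"units": "K"},
)

# Label-based selection: the analyst asks for a date, not a positional index.
day1 = cube.sel(time="2021-01-01")
print(day1.values)  # [[1, 2, 3], [4, 5, 6]]
print(day1.dims)    # ('y', 'x')
```

In Xarray proper the same pattern appears as `DataArray.sel`, where label-based indexing replaces the manual bookkeeping that the "download model" workflows described above tend to require.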
