AWS NOAA WHOI #221

Merged: 7 commits merged on Dec 13, 2022. (Diff below shows changes from 4 commits.)
26 changes: 26 additions & 0 deletions recipes/aws-noaa-whoi/meta.yaml
@@ -0,0 +1,26 @@
title: 'AWS NOAA WHOI SST'
description: 'Analysis-ready datasets derived from AWS NOAA WHOI NetCDF'
pangeo_forge_version: '0.9.2'
pangeo_notebook_version: '2021.07.17'
recipes:
  - id: aws-noaa-sea-surface-temp-whoi
    object: 'recipe:recipe'
provenance:
  providers:
    - name: 'AWS NOAA Oceanic CDR'
      description: 'Registry of Open Data on AWS National Oceanographic & Atmospheric Administration National Centers for Environmental Information'
      roles:
        - producer
        - licensor
      url: s3://noaa-cdr-sea-surface-temp-whoi-pds/
  license: 'Open Data'
maintainers:
  - name: 'Kathryn Berger'
    orcid: '0000-0001-9731-6519'
    github: kathrynberger
bakery:
  id: 'devseed.bakery.development.aws.us-west-2'  # must come from a valid list of bakeries
  target: pangeo-forge-aws-bakery-flowcachebucketdasktest4-10neo67y7a924
  resources:
    memory: 4096
    cpu: 1024
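
As an aside on how this configuration ties to the code below: `object: 'recipe:recipe'` is a module:attribute reference, i.e. the `recipe` object defined at the bottom of recipe.py in the same directory. The snippet below is a minimal sketch of that lookup convention for illustration only; it is not pangeo-forge's actual loader, and everything beyond the 'recipe:recipe' string taken from this meta.yaml is assumed.

import importlib

# Sketch only: resolve a '<module>:<attribute>' reference the way the
# meta.yaml entry implies -- module name before the colon, attribute after it.
ref = 'recipe:recipe'
module_name, _, attr_name = ref.partition(':')

module = importlib.import_module(module_name)  # imports recipe.py (must be on sys.path)
recipe_obj = getattr(module, attr_name)        # the `recipe` object defined in recipe.py
print(type(recipe_obj))                        # expected: an HDFReferenceRecipe instance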
21 changes: 21 additions & 0 deletions recipes/aws-noaa-whoi/recipe.py
@@ -0,0 +1,21 @@
import pandas as pd

from pangeo_forge_recipes.patterns import ConcatDim, FilePattern
from pangeo_forge_recipes.recipes.reference_hdf_zarr import HDFReferenceRecipe

start_date = '1988-01-01'


def format_function(time):
    base = pd.Timestamp(start_date)
    day = base + pd.Timedelta(days=time)
    input_url_pattern = (
        's3://noaa-cdr-sea-surface-temp-whoi-pds/data/{day:%Y}'
        '/SEAFLUX-OSB-CDR_V02R00_SST_D{day:%Y%m%d}_C*.nc'

Contributor (@rabernat):

Does this actually work? I did not think glob-style wildcards were supported by s3fs! 🤯

Contributor Author (@kathrynberger):

@rabernat, thanks so much for your feedback. It did appear to work correctly when I tried it on 3 months' worth of data, but that may not have been a wide enough test to pick up duplicated or incorrect data. I agree with your recommendation to follow a deterministic file pattern as better practice. I'll revise following the example you've provided. 👍

Contributor Author (@kathrynberger):

Implemented the deterministic file pattern as recommended above and successfully tested it on a 3-year dataset. All output looks good.


    )
    return input_url_pattern.format(day=day)


dates = pd.date_range(start_date, '2022-11-08', freq='D')
pattern = FilePattern(format_function, ConcatDim('time', range(len(dates)), 1))
recipe = HDFReferenceRecipe(pattern, netcdf_storage_options={'anon': True})
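
Following up on the wildcard discussion in the review thread above: the `_C*` segment encodes a per-file creation timestamp, so the date alone does not fully determine the URL. One way to make each input deterministic is to resolve the wildcard once, at pattern-build time, via an anonymous s3fs listing. The sketch below only illustrates that idea, assuming the bucket permits anonymous listing and exactly one file exists per day; it is not necessarily the revision adopted in the later commits of this PR (not shown in this diff), and `deterministic_format_function` is a hypothetical name.

import pandas as pd
import s3fs

start_date = '1988-01-01'
fs = s3fs.S3FileSystem(anon=True)  # the NOAA CDR bucket is public

def deterministic_format_function(time):
    # Resolve the one concrete key for this day instead of handing a glob
    # pattern to the recipe; fail loudly if the match is not unique.
    day = pd.Timestamp(start_date) + pd.Timedelta(days=time)
    matches = fs.glob(
        f'noaa-cdr-sea-surface-temp-whoi-pds/data/{day:%Y}'
        f'/SEAFLUX-OSB-CDR_V02R00_SST_D{day:%Y%m%d}_C*.nc'
    )
    if len(matches) != 1:
        raise ValueError(f'expected exactly one file for {day:%Y-%m-%d}, got {matches}')
    return f's3://{matches[0]}'

print(deterministic_format_function(0))  # concrete URL for 1988-01-01

Because the full date range covers more than 12,000 daily files, one listing per file is slow at pattern-build time; caching a single listing per year directory would be the more practical variant of the same idea.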