From 10d1678b2ec25187fef758c30805a3074ce10cef Mon Sep 17 00:00:00 2001 From: GitHub Action Date: Thu, 9 Jan 2025 04:58:37 +0000 Subject: [PATCH] Updated datasets 2025-01-09 UTC --- aws_open_datasets.json | 746 +++++++++++++++-------------- aws_open_datasets.tsv | 139 +++--- datasets/satellogic-earthview.yaml | 30 ++ 3 files changed, 488 insertions(+), 427 deletions(-) create mode 100644 datasets/satellogic-earthview.yaml diff --git a/aws_open_datasets.json b/aws_open_datasets.json index b6dcdcb..da738e7 100644 --- a/aws_open_datasets.json +++ b/aws_open_datasets.json @@ -17233,8 +17233,8 @@ }, { "Name": "NOAA Atmospheric Climate Data Records", - "Description": "Cloud Properties Polar Orbiter", - "ARN": "arn:aws:s3:::noaa-cdr-cloud-properties-polar-orbiter-nasa-pds", + "Description": "Hydrological Properties", + "ARN": "arn:aws:s3:::noaa-cdr-hydrological-properties-pds", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://www.ncei.noaa.gov/products/climate-data-records/atmospheric", @@ -17251,7 +17251,7 @@ "weather" ], "Explore": [ - "[Browse Bucket](https://noaa-cdr-cloud-properties-polar-orbiter-nasa-pds.s3.amazonaws.com/index.html)" + "[Browse Bucket](https://noaa-cdr-hydrological-properties-pds.s3.amazonaws.com/index.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -17287,8 +17287,8 @@ }, { "Name": "NOAA Atmospheric Climate Data Records", - "Description": "Hydrological Properties", - "ARN": "arn:aws:s3:::noaa-cdr-hydrological-properties-pds", + "Description": "Cloud Properties Polar Orbiter", + "ARN": "arn:aws:s3:::noaa-cdr-cloud-properties-polar-orbiter-nasa-pds", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://www.ncei.noaa.gov/products/climate-data-records/atmospheric", @@ -17305,7 +17305,7 @@ "weather" ], "Explore": [ - "[Browse Bucket](https://noaa-cdr-hydrological-properties-pds.s3.amazonaws.com/index.html)" + "[Browse Bucket](https://noaa-cdr-cloud-properties-polar-orbiter-nasa-pds.s3.amazonaws.com/index.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -18433,10 +18433,10 @@ }, { "Name": "NOAA Global Data Assimilation (DA) Test Data", - "Description": "Global Data Assimilation (DA) System Test Data", - "ARN": "arn:aws:s3:::noaa-ufs-gdas-pds", + "Description": "New data notifications for Global Data Assimilation (DA) System Test Data, only Lambda and SQS protocols allowed", + "ARN": "arn:aws:sns:us-east-1:709902155096:NewNWSUFSGDASObject", "Region": "us-east-1", - "Type": "S3 Bucket", + "Type": "SNS Topic", "Documentation": "https://github.com/NOAA-EMC/GDASApp/wiki", "Contact": "For questions regarding data content or quality, post on the ufs-community forum at https://github.com/orgs/ufs-community/discussions or email support.epic@noaa.gov. For any questions regarding data delivery or any general questions regarding the NOAA Open Data Dissemination (NODD) Program, email the NODD Team at nodd@noaa.gov.
We also seek to identify case studies on how NOAA data is being used and will be featuring those stories in joint publications and in upcoming events. If you are interested in seeing your story highlighted, please share it with the NODD team by emailing nodd@noaa.gov", "ManagedBy": "[NOAA](http://www.noaa.gov/)", @@ -18451,9 +18451,7 @@ "meteorological", "weather" ], - "Explore": [ - "[Browse Bucket](https://noaa-ufs-gdas-pds.s3.amazonaws.com/index.html)" - ], + "Explore": null, "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, @@ -18461,10 +18459,10 @@ }, { "Name": "NOAA Global Data Assimilation (DA) Test Data", - "Description": "New data notifications for Global Data Assimilation (DA) System Test Data, only Lambda and SQS protocols allowed", - "ARN": "arn:aws:sns:us-east-1:709902155096:NewNWSUFSGDASObject", + "Description": "Global Data Assimilation (DA) System Test Data", + "ARN": "arn:aws:s3:::noaa-ufs-gdas-pds", "Region": "us-east-1", - "Type": "SNS Topic", + "Type": "S3 Bucket", "Documentation": "https://github.com/NOAA-EMC/GDASApp/wiki", "Contact": "For questions regarding data content or quality, post on the ufs-community forum at https://github.com/orgs/ufs-community/discussions or email support.epic@noaa.gov. For any questions regarding data delivery or any general questions regarding the NOAA Open Data Dissemination (NODD) Program, email the NODD Team at nodd@noaa.gov.
We also seek to identify case studies on how NOAA data is being used and will be featuring those stories in joint publications and in upcoming events. If you are interested in seeing your story highlighted, please share it with the NODD team by emailing nodd@noaa.gov", "ManagedBy": "[NOAA](http://www.noaa.gov/)", @@ -18479,7 +18477,9 @@ "meteorological", "weather" ], - "Explore": null, + "Explore": [ + "[Browse Bucket](https://noaa-ufs-gdas-pds.s3.amazonaws.com/index.html)" + ], "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, @@ -19715,8 +19715,8 @@ }, { "Name": "NOAA National Water Model CONUS Retrospective Dataset", - "Description": "The complete archive of NWM input forcing and model output data version 30 in NetCDF and Zarr format", - "ARN": "arn:aws:s3:::noaa-nwm-retrospective-3-0-pds", + "Description": "The complete archive of NWM model output data version 21 in Zarr format The NWM precipitation input forcing in Zarr format", + "ARN": "arn:aws:s3:::noaa-nwm-retrospective-2-1-zarr-pds", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md", @@ -19735,7 +19735,7 @@ "transportation" ], "Explore": [ - "[Browse Bucket](https://noaa-nwm-retrospective-3-0-pds.s3.amazonaws.com/index.html)" + "[Browse Bucket](https://noaa-nwm-retrospective-2-1-zarr-pds.s3.amazonaws.com/index.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -19802,8 +19802,8 @@ }, { "Name": "NOAA National Water Model CONUS Retrospective Dataset", - "Description": "The complete archive of NWM input forcing and model output data version 21 in NetCDF format", - "ARN": "arn:aws:s3:::noaa-nwm-retrospective-2-1-pds", + "Description": "The complete archive of NWM input forcing and model output data version 30 in NetCDF and Zarr format", + "ARN": "arn:aws:s3:::noaa-nwm-retrospective-3-0-pds", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md", @@ -19822,7 +19822,7 @@ "transportation" ], "Explore": [ - "[Browse Bucket](https://noaa-nwm-retrospective-2-1-pds.s3.amazonaws.com/index.html)" + "[Browse Bucket](https://noaa-nwm-retrospective-3-0-pds.s3.amazonaws.com/index.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -19831,8 +19831,8 @@ }, { "Name": "NOAA National Water Model CONUS Retrospective Dataset", - "Description": "The complete archive of NWM model output data version 21 in Zarr format The NWM precipitation input forcing in Zarr format", - "ARN": "arn:aws:s3:::noaa-nwm-retrospective-2-1-zarr-pds", + "Description": "The complete archive of NWM input forcing and model output data version 21 in NetCDF format", + "ARN": "arn:aws:s3:::noaa-nwm-retrospective-2-1-pds", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md", @@ -19851,7 +19851,7 @@ "transportation" ], "Explore": [ - "[Browse Bucket](https://noaa-nwm-retrospective-2-1-zarr-pds.s3.amazonaws.com/index.html)" + "[Browse Bucket](https://noaa-nwm-retrospective-2-1-pds.s3.amazonaws.com/index.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -20759,10 +20759,10 @@ }, { "Name": "NOAA U.S. Climate Gridded Dataset (NClimGrid)", - "Description": "New data notifications for Daily NClimGrid, only Lambda and SQS protocols allowed", - "ARN": "arn:aws:sns:us-east-1:123901341784:NewNClimGridMonthlyObject", + "Description": "Monthly NClimGrid Data", + "ARN": "arn:aws:s3:::noaa-nclimgrid-monthly-pds", "Region": "us-east-1", - "Type": "SNS Topic", + "Type": "S3 Bucket", "Documentation": "https://www.ncei.noaa.gov/access/metadata/landing-page/bin/iso?id=gov.noaa.ncdc:C00332", "Contact": "For any questions regarding data delivery or any general questions regarding the NOAA Open Data Dissemination (NODD) Program, email the NODD Team at nodd@noaa.gov.
We also seek to identify case studies on how NOAA data is being used and will be featuring those stories in joint publications and in upcoming events. If you are interested in seeing your story highlighted, please share it with the NODD team by emailing nodd@noaa.gov", "ManagedBy": "[NOAA](http://www.noaa.gov/)", @@ -20775,7 +20775,9 @@ "meteorological", "weather" ], - "Explore": null, + "Explore": [ + "[Browse Bucket](https://noaa-nclimgrid-monthly-pds.s3.amazonaws.com/index.html)" + ], "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, @@ -20783,10 +20785,10 @@ }, { "Name": "NOAA U.S. Climate Gridded Dataset (NClimGrid)", - "Description": "Monthly NClimGrid Data", - "ARN": "arn:aws:s3:::noaa-nclimgrid-monthly-pds", + "Description": "New data notifications for Daily NClimGrid, only Lambda and SQS protocols allowed", + "ARN": "arn:aws:sns:us-east-1:123901341784:NewNClimGridMonthlyObject", "Region": "us-east-1", - "Type": "S3 Bucket", + "Type": "SNS Topic", "Documentation": "https://www.ncei.noaa.gov/access/metadata/landing-page/bin/iso?id=gov.noaa.ncdc:C00332", "Contact": "For any questions regarding data delivery or any general questions regarding the NOAA Open Data Dissemination (NODD) Program, email the NODD Team at nodd@noaa.gov.
We also seek to identify case studies on how NOAA data is being used and will be featuring those stories in joint publications and in upcoming events. If you are interested in seeing your story highlighted, please share it with the NODD team by emailing nodd@noaa.gov", "ManagedBy": "[NOAA](http://www.noaa.gov/)", @@ -20799,9 +20801,7 @@ "meteorological", "weather" ], - "Explore": [ - "[Browse Bucket](https://noaa-nclimgrid-monthly-pds.s3.amazonaws.com/index.html)" - ], + "Explore": null, "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, @@ -21353,10 +21353,10 @@ }, { "Name": "NOAA Whole Atmosphere Model-Ionosphere Plasmasphere Electrodynamics (WAM-IPE) Forecast System (WFS)", - "Description": "New data notifications for NOAA WAM-IPE Products, only Lambda and SQS protocols allowed", - "ARN": "arn:aws:sns:us-east-1:709902155096:NewWIFSObject", + "Description": "NOAA WAM-IPE Products", + "ARN": "arn:aws:s3:::noaa-nws-wam-ipe-pds", "Region": "us-east-1", - "Type": "SNS Topic", + "Type": "S3 Bucket", "Documentation": "https://www.swpc.noaa.gov/products/wam-ipe", "Contact": "For any questions regarding WAM-IPE data, please contact Adam Kubaryk (adam.kubaryk@noaa.gov) and/or Tzu-Wei Fang (tzu-wei.fang@noaa.gov) For data delivery or any general questions regarding the NOAA Open Data Dissemination (NODD) Program, email the NODD Team at nodd@noaa.gov.
We also seek to identify case studies on how NOAA data is being used and will be featuring those stories in joint publications and in upcoming events. If you are interested in seeing your story highlighted, please share it with the NODD team by emailing nodd@noaa.gov", "ManagedBy": "[NOAA](http://www.noaa.gov/)", @@ -21369,7 +21369,9 @@ "solar", "weather" ], - "Explore": null, + "Explore": [ + "[Browse Bucket](https://noaa-nws-wam-ipe-pds.s3.amazonaws.com/index.html)" + ], "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, @@ -21377,10 +21379,10 @@ }, { "Name": "NOAA Whole Atmosphere Model-Ionosphere Plasmasphere Electrodynamics (WAM-IPE) Forecast System (WFS)", - "Description": "NOAA WAM-IPE Products", - "ARN": "arn:aws:s3:::noaa-nws-wam-ipe-pds", + "Description": "New data notifications for NOAA WAM-IPE Products, only Lambda and SQS protocols allowed", + "ARN": "arn:aws:sns:us-east-1:709902155096:NewWIFSObject", "Region": "us-east-1", - "Type": "S3 Bucket", + "Type": "SNS Topic", "Documentation": "https://www.swpc.noaa.gov/products/wam-ipe", "Contact": "For any questions regarding WAM-IPE data, please contact Adam Kubaryk (adam.kubaryk@noaa.gov) and/or Tzu-Wei Fang (tzu-wei.fang@noaa.gov) For data delivery or any general questions regarding the NOAA Open Data Dissemination (NODD) Program, email the NODD Team at nodd@noaa.gov.
We also seek to identify case studies on how NOAA data is being used and will be featuring those stories in joint publications and in upcoming events. If you are interested in seeing your story highlighted, please share it with the NODD team by emailing nodd@noaa.gov", "ManagedBy": "[NOAA](http://www.noaa.gov/)", @@ -21393,9 +21395,7 @@ "solar", "weather" ], - "Explore": [ - "[Browse Bucket](https://noaa-nws-wam-ipe-pds.s3.amazonaws.com/index.html)" - ], + "Explore": null, "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, @@ -22438,8 +22438,8 @@ }, { "Name": "NREL Wind Integration National Dataset", - "Description": "Bias corrected Indonesia wind resource", - "ARN": "arn:aws:s3:::nrel-pds-wtk/indonesia/", + "Description": "California offshore wind resource data (2000-2022) in HDF5 format", + "ARN": "arn:aws:s3:::nrel-pds-wtk/now23_california/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://www.nrel.gov/grid/wind-toolkit.html", @@ -22454,7 +22454,7 @@ "meteorological" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=indonesia%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=now23_california%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -22463,8 +22463,8 @@ }, { "Name": "NREL Wind Integration National Dataset", - "Description": "Mid Atlantic wind resource data with modeled wakes in HDF5 format", - "ARN": "arn:aws:s3:::nrel-pds-wtk/NOW-WAKES_Mid_Atlantic/", + "Description": "Bias corrected Indonesia wind resource", + "ARN": "arn:aws:s3:::nrel-pds-wtk/indonesia/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://www.nrel.gov/grid/wind-toolkit.html", @@ -22479,7 +22479,7 @@ "meteorological" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=NOW-WAKES_Mid_Atlantic%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=indonesia%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -22488,8 +22488,8 @@ }, { "Name": "NREL Wind Integration National Dataset", - "Description": "Southeast Asia wind resource data v3 (2007-2021) in HDF5 format", - "ARN": "arn:aws:s3:::nrel-pds-wtk/seasiawind_v3/", + "Description": "Mid Atlantic wind resource data with modeled wakes in HDF5 format", + "ARN": "arn:aws:s3:::nrel-pds-wtk/NOW-WAKES_Mid_Atlantic/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://www.nrel.gov/grid/wind-toolkit.html", @@ -22504,7 +22504,7 @@ "meteorological" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=seasiawind_v3%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=NOW-WAKES_Mid_Atlantic%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -22513,8 +22513,8 @@ }, { "Name": "NREL Wind Integration National Dataset", - "Description": "Southeast Asia wind resource data v2 (2007-2021) in HDF5 format", - "ARN": "arn:aws:s3:::nrel-pds-wtk/seasiawind_v2/", + "Description": "Southeast Asia wind resource data v3 (2007-2021) in HDF5 format", + "ARN": "arn:aws:s3:::nrel-pds-wtk/seasiawind_v3/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://www.nrel.gov/grid/wind-toolkit.html", @@ -22529,7 +22529,7 @@ "meteorological" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=seasiawind_v2%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=seasiawind_v3%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -22538,8 +22538,8 @@ }, { "Name": "NREL Wind Integration National Dataset", - "Description": "Data for the Eastern Wind Integration Study (2004-2006", - "ARN": "arn:aws:s3:::nrel-pds-wtk/eastern_wind/", + "Description": "Southeast Asia wind resource data v2 (2007-2021) in HDF5 format", + "ARN": "arn:aws:s3:::nrel-pds-wtk/seasiawind_v2/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://www.nrel.gov/grid/wind-toolkit.html", @@ -22554,7 +22554,7 @@ "meteorological" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=eastern_wind%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=seasiawind_v2%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -22588,8 +22588,8 @@ }, { "Name": "NREL Wind Integration National Dataset", - "Description": "California offshore wind resource data (2000-2022) in HDF5 format", - "ARN": "arn:aws:s3:::nrel-pds-wtk/now23_california/", + "Description": "South Atlantic offshore wind resource data (2000-2020) in HDF5 format", + "ARN": "arn:aws:s3:::nrel-pds-wtk/south_atlantic/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://www.nrel.gov/grid/wind-toolkit.html", @@ -22604,7 +22604,7 @@ "meteorological" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=now23_california%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=south_atlantic)" ], "RequesterPays": null, "ControlledAccess": null, @@ -22663,8 +22663,8 @@ }, { "Name": "NREL Wind Integration National Dataset", - "Description": "Mid Atlantic three-dimensional planetary boundary layer (3D PBL) scheme wind resource data", - "ARN": "arn:aws:s3:::nrel-pds-wtk/mid_atlantic_3d_pbl/", + "Description": "Bias Corrected NOAA HRRR Wind Resource Data for Grid Integration Applications", + "ARN": "arn:aws:s3:::nrel-pds-wtk/bchrrr/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://www.nrel.gov/grid/wind-toolkit.html", @@ -22679,7 +22679,7 @@ "meteorological" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=mid_atlantic_3d_pbl%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=bchrrr%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -22713,8 +22713,8 @@ }, { "Name": "NREL Wind Integration National Dataset", - "Description": "Bias Corrected NOAA HRRR Wind Resource Data for Grid Integration Applications", - "ARN": "arn:aws:s3:::nrel-pds-wtk/bchrrr/", + "Description": "Data for the Eastern Wind Integration Study (2004-2006", + "ARN": "arn:aws:s3:::nrel-pds-wtk/eastern_wind/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://www.nrel.gov/grid/wind-toolkit.html", @@ -22729,7 +22729,7 @@ "meteorological" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=bchrrr%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=eastern_wind%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -22738,8 +22738,8 @@ }, { "Name": "NREL Wind Integration National Dataset", - "Description": "South Atlantic offshore wind resource data (2000-2020) in HDF5 format", - "ARN": "arn:aws:s3:::nrel-pds-wtk/south_atlantic/", + "Description": "Mid Atlantic three-dimensional planetary boundary layer (3D PBL) scheme wind resource data", + "ARN": "arn:aws:s3:::nrel-pds-wtk/mid_atlantic_3d_pbl/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://www.nrel.gov/grid/wind-toolkit.html", @@ -22754,7 +22754,7 @@ "meteorological" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=south_atlantic)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=mid_atlantic_3d_pbl%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -25137,10 +25137,10 @@ }, { "Name": "OpenAQ", - "Description": "OpenAQ API", - "ARN": null, + "Description": "SNS topic for new objects in the openaq-data-archive bucket", + "ARN": "arn:aws:sns:us-east-1:817926761842:openaq-data-archive-object_created", "Region": "us-east-1", - "Type": "CloudFront Distribution", + "Type": "SNS Topic", "Documentation": "https://openaq.org", "Contact": "info@openaq.org", "ManagedBy": "[OpenAQ](https://openaq.org)", @@ -25157,14 +25157,14 @@ "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, - "Host": "api.openaq.org" + "Host": null }, { "Name": "OpenAQ", - "Description": "SNS topic for new objects in the openaq-data-archive bucket", - "ARN": "arn:aws:sns:us-east-1:817926761842:openaq-data-archive-object_created", + "Description": "Daily gzipped CSVs of global air quality measurements fetched from sources all over the world", + "ARN": "arn:aws:s3:::openaq-data-archive", "Region": "us-east-1", - "Type": "SNS Topic", + "Type": "S3 Bucket", "Documentation": "https://openaq.org", "Contact": "info@openaq.org", "ManagedBy": "[OpenAQ](https://openaq.org)", @@ -25185,10 +25185,10 @@ }, { "Name": "OpenAQ", - "Description": "Daily gzipped CSVs of global air quality measurements fetched from sources all over the world", - "ARN": "arn:aws:s3:::openaq-data-archive", + "Description": "OpenAQ API", + "ARN": null, "Region": "us-east-1", - "Type": "S3 Bucket", + "Type": "CloudFront Distribution", "Documentation": "https://openaq.org", "Contact": "info@openaq.org", "ManagedBy": "[OpenAQ](https://openaq.org)", @@ -25205,7 +25205,7 @@ "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, - "Host": null + "Host": "api.openaq.org" }, { "Name": "OpenAerialMap on AWS", @@ -25235,8 +25235,8 @@ }, { "Name": "OpenAlex dataset", - "Description": "Openalex Entities decomposed to tab-separated columnar files for backward compatibility with Microsoft Academic Graph", - "ARN": "arn:aws:s3:::openalex-mag-format", + "Description": "OpenAlex Entities in JSON Lines format", + "ARN": "arn:aws:s3:::openalex", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://docs.openalex.org", @@ -25252,7 +25252,7 @@ "aws-pds" ], "Explore": [ - "[Browse Bucket](https://openalex-mag-format.s3.amazonaws.com/browse.html)" + "[Browse Bucket](https://openalex.s3.amazonaws.com/browse.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -25261,8 +25261,8 @@ }, { "Name": "OpenAlex dataset", - "Description": "OpenAlex Entities in JSON Lines format", - "ARN": "arn:aws:s3:::openalex", + "Description": "Openalex Entities decomposed to tab-separated columnar files for backward compatibility with Microsoft Academic Graph", + "ARN": "arn:aws:s3:::openalex-mag-format", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://docs.openalex.org", @@ -25278,7 +25278,7 @@ "aws-pds" ], "Explore": [ - "[Browse Bucket](https://openalex.s3.amazonaws.com/browse.html)" + "[Browse Bucket](https://openalex-mag-format.s3.amazonaws.com/browse.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -25287,9 +25287,9 @@ }, { "Name": "OpenCRAVAT", - "Description": "OpenCRAVAT Store EU", - "ARN": "arn:aws:s3:::opencravat-store-eu-west-2", - "Region": "eu-west-2", + "Description": "OpenCRAVAT Store US", + "ARN": "arn:aws:s3:::opencravat-store-aws", + "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://open-cravat.readthedocs.io", "Contact": "support@opencravat.org", @@ -25313,9 +25313,9 @@ }, { "Name": "OpenCRAVAT", - "Description": "OpenCRAVAT Store US", - "ARN": "arn:aws:s3:::opencravat-store-aws", - "Region": "us-east-1", + "Description": "OpenCRAVAT Store EU", + "ARN": "arn:aws:s3:::opencravat-store-eu-west-2", + "Region": "eu-west-2", "Type": "S3 Bucket", "Documentation": "https://open-cravat.readthedocs.io", "Contact": "support@opencravat.org", @@ -25517,8 +25517,8 @@ }, { "Name": "OpenUniverse 2024 Matched Rubin and Roman Simulations: Preview", - "Description": "The simulated Rubin data products include raw pixel data, calibrated exposures, coadds of the calibrated exposures, and catalogs of photometry measured from the simulated images", - "ARN": "arn:aws:s3:::nasa-irsa-simulations/openuniverse2024/rubin/", + "Description": "The simulated Roman data products include truth files listing the basic physical properties of the simulated astronomical objects; truth images that include the appropriate bandpass and PSF but limited sources of noise; calibrated images that include relevant backgrounds and major sources of noise; and coadded images created using the IMCOM software", + "ARN": "arn:aws:s3:::nasa-irsa-simulations/openuniverse2024/roman/", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://irsa.ipac.caltech.edu/data/theory/openuniverse2024", @@ -25544,8 +25544,8 @@ }, { "Name": "OpenUniverse 2024 Matched Rubin and Roman Simulations: Preview", - "Description": "The simulated Roman data products include truth files listing the basic physical properties of the simulated astronomical objects; truth images that include the appropriate bandpass and PSF but limited sources of noise; calibrated images that include relevant backgrounds and major sources of noise; and coadded images created using the IMCOM software", - "ARN": "arn:aws:s3:::nasa-irsa-simulations/openuniverse2024/roman/", + "Description": "The simulated Rubin data products include raw pixel data, calibrated exposures, coadds of the calibrated exposures, and catalogs of photometry measured from the simulated images", + "ARN": "arn:aws:s3:::nasa-irsa-simulations/openuniverse2024/rubin/", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://irsa.ipac.caltech.edu/data/theory/openuniverse2024", @@ -25596,8 +25596,8 @@ }, { "Name": "Orcasound - bioacoustic data for marine conservation", - "Description": "Live-streamed orca audio data (HLS)", - "ARN": "arn:aws:s3:::streaming-orcasound-net", + "Description": "Archived lossless orca audio data (FLAC)", + "ARN": "arn:aws:s3:::archive-orcasound-net", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/orcasound/orcadata/wiki", @@ -25630,8 +25630,8 @@ }, { "Name": "Orcasound - bioacoustic data for marine conservation", - "Description": "Archived lossless orca audio data (FLAC)", - "ARN": "arn:aws:s3:::archive-orcasound-net", + "Description": "Live-streamed orca audio data (HLS)", + "ARN": "arn:aws:s3:::streaming-orcasound-net", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/orcasound/orcadata/wiki", @@ -25721,10 +25721,10 @@ }, { "Name": "Overture Maps Foundation Open Map Data", - "Description": "New File Notification", - "ARN": "arn:aws:sns:us-west-2:913550007193:overturemaps-us-west-2", + "Description": "Overture Maps Foundation Data (GeoParquet)", + "ARN": "arn:aws:s3:::overturemaps-us-west-2/release/", "Region": "us-west-2", - "Type": "SNS Topic", + "Type": "S3 Bucket", "Documentation": "Documentation is available at [docs.overturemaps.org](https://docs.overturemaps.org/)", "Contact": "info@overturemaps.org", "ManagedBy": "[Overture Maps Foundation](https://overturemaps.org)", @@ -25747,10 +25747,10 @@ }, { "Name": "Overture Maps Foundation Open Map Data", - "Description": "Overture Maps Foundation Data (GeoParquet)", - "ARN": "arn:aws:s3:::overturemaps-us-west-2/release/", + "Description": "New File Notification", + "ARN": "arn:aws:sns:us-west-2:913550007193:overturemaps-us-west-2", "Region": "us-west-2", - "Type": "S3 Bucket", + "Type": "SNS Topic", "Documentation": "Documentation is available at [docs.overturemaps.org](https://docs.overturemaps.org/)", "Contact": "info@overturemaps.org", "ManagedBy": "[Overture Maps Foundation](https://overturemaps.org)", @@ -25773,8 +25773,8 @@ }, { "Name": "Oxford Nanopore Technologies Benchmark Datasets", - "Description": "Using nanopore sequencing, researchers have directly identified DNA and RNA base modifications at nucleotide resolution, including 5-methylycytosine, 5-hydroxymethylcytosine, N6-methyladenosine, 5-bromodeoxyuridine in DAN; and N6-methyladenosine in RNA, with detection of other natural or synthetic epigenetic modifications possible through training basecalling algorithms One of the most widespread genomic modifications is 5-methylcytosine (5mC), which most frequently occurs at dinucleotides Compared to whole-genome bisulfite sequencing, the traditional method of 5mC detection, nanopore technology can offer many advantagesThe following cell lines/DNA samples were obtained from the NIGMS Human Genetic Cell Repository at the Coriell Institute for Medical Research: GM24385", - "ARN": "arn:aws:s3:::ont-open-data/gm24385_mod_2021.09/extra_analysis/bonito_remora", + "Description": "CpG dinucleotides frequently occur in high-density clusters called CpG islands (CGI) and >60% of human genes have their promoters embedded within CGIs Determining the methylation status of cytosines within CpGs is of substantial biological interest: alterations in methylation patterns within promoters is associated with changes in gene expression and disease states such as cancer Exploring methylation differences between tumour samples and normal samples can help to elucidate mechanisms associated with tumour formation and development Nanopore sequencing enables direct detection of methylated cytosines (eg at CpG sites), without the need for bisulfite conversionOxford Nanopore\u2019s Adaptive Sampling offers a flexible method to enrich regions of interest (eg CGIs) by depleting off-target regions during the sequencing run itself with no upfront sample manipulation Here we introduce Reduced Representation Methylation Sequencing (RRMS) to target 310 Mb of the human genome including regions which are highly enriched for CpGs including ~28,000 CpG islands, ~50,600 shores and ~42,700 shelves as well as ~21,600 promoter regions", + "ARN": "arn:aws:s3:::ont-open-data/rrms_2022.07", "Region": "eu-west-1", "Type": "S3 Bucket", "Documentation": "https://labs.epi2me.io/dataindex/", @@ -25801,8 +25801,8 @@ }, { "Name": "Oxford Nanopore Technologies Benchmark Datasets", - "Description": "CpG dinucleotides frequently occur in high-density clusters called CpG islands (CGI) and >60% of human genes have their promoters embedded within CGIs Determining the methylation status of cytosines within CpGs is of substantial biological interest: alterations in methylation patterns within promoters is associated with changes in gene expression and disease states such as cancer Exploring methylation differences between tumour samples and normal samples can help to elucidate mechanisms associated with tumour formation and development Nanopore sequencing enables direct detection of methylated cytosines (eg at CpG sites), without the need for bisulfite conversionOxford Nanopore\u2019s Adaptive Sampling offers a flexible method to enrich regions of interest (eg CGIs) by depleting off-target regions during the sequencing run itself with no upfront sample manipulation Here we introduce Reduced Representation Methylation Sequencing (RRMS) to target 310 Mb of the human genome including regions which are highly enriched for CpGs including ~28,000 CpG islands, ~50,600 shores and ~42,700 shelves as well as ~21,600 promoter regions", - "ARN": "arn:aws:s3:::ont-open-data/rrms_2022.07", + "Description": "Using nanopore sequencing, researchers have directly identified DNA and RNA base modifications at nucleotide resolution, including 5-methylycytosine, 5-hydroxymethylcytosine, N6-methyladenosine, 5-bromodeoxyuridine in DAN; and N6-methyladenosine in RNA, with detection of other natural or synthetic epigenetic modifications possible through training basecalling algorithms One of the most widespread genomic modifications is 5-methylcytosine (5mC), which most frequently occurs at dinucleotides Compared to whole-genome bisulfite sequencing, the traditional method of 5mC detection, nanopore technology can offer many advantagesThe following cell lines/DNA samples were obtained from the NIGMS Human Genetic Cell Repository at the Coriell Institute for Medical Research: GM24385", + "ARN": "arn:aws:s3:::ont-open-data/gm24385_mod_2021.09/extra_analysis/bonito_remora", "Region": "eu-west-1", "Type": "S3 Bucket", "Documentation": "https://labs.epi2me.io/dataindex/", @@ -25829,8 +25829,8 @@ }, { "Name": "Oxford Nanopore Technologies Benchmark Datasets", - "Description": "Oxford Nanopore Open Datasets", - "ARN": "arn:aws:s3:::ont-open-data", + "Description": "Nanopore sequencing data of the Genome in a Bottle samples NA24385, NA24149, and NA24143 (HG002-HG004) using the LSK114 sequencing chemistry The direct sequencer output is included, raw signal data stored in fast5 files and basecalled data in fastq file Additional secondary analyses are included, notably alignments of sequence data to the reference genome and variant calls are provided along with statistics derived from theseThe following cell lines/DNA samples were obtained from the NIGMS Human Genetic Cell Repository at the Coriell Institute for Medical Research: NA24385, NA24149, and NA24143", + "ARN": "arn:aws:s3:::ont-open-data/giab_lsk114_2022.12", "Region": "eu-west-1", "Type": "S3 Bucket", "Documentation": "https://labs.epi2me.io/dataindex/", @@ -25857,8 +25857,8 @@ }, { "Name": "Oxford Nanopore Technologies Benchmark Datasets", - "Description": "Nanopore sequencing data of the Genome in a Bottle samples NA24385, NA24149, and NA24143 (HG002-HG004) using the LSK114 sequencing chemistry The direct sequencer output is included, raw signal data stored in fast5 files and basecalled data in fastq file Additional secondary analyses are included, notably alignments of sequence data to the reference genome and variant calls are provided along with statistics derived from theseThe following cell lines/DNA samples were obtained from the NIGMS Human Genetic Cell Repository at the Coriell Institute for Medical Research: NA24385, NA24149, and NA24143", - "ARN": "arn:aws:s3:::ont-open-data/giab_lsk114_2022.12", + "Description": "Oxford Nanopore Open Datasets", + "ARN": "arn:aws:s3:::ont-open-data", "Region": "eu-west-1", "Type": "S3 Bucket", "Documentation": "https://labs.epi2me.io/dataindex/", @@ -26105,8 +26105,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2018", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2018", + "Description": "original 256 kHz audio recordings year 2015", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2015", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26137,8 +26137,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "decimated 16 kHz audio recordings", - "ARN": "arn:aws:s3:::pacific-sound-16khz", + "Description": "machine learning models", + "ARN": "arn:aws:s3:::pacific-sound-models", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26169,8 +26169,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2017", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2017", + "Description": "decimated 16 kHz audio recordings", + "ARN": "arn:aws:s3:::pacific-sound-16khz", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26201,8 +26201,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2016", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2016", + "Description": "decimated 2 kHz audio recordings", + "ARN": "arn:aws:s3:::pacific-sound-2khz", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26233,8 +26233,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2019", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2019", + "Description": "original 256 kHz audio recordings year 2025", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2025", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26265,8 +26265,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2020", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2020", + "Description": "original 256 kHz audio recordings year 2023", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2023", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26297,8 +26297,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "decimated 2 kHz audio recordings", - "ARN": "arn:aws:s3:::pacific-sound-2khz", + "Description": "original 256 kHz audio recordings year 2022", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2022", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26329,8 +26329,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2022", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2022", + "Description": "original 256 kHz audio recordings year 2021", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2021", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26361,8 +26361,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2023", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2023", + "Description": "original 256 kHz audio recordings year 2020", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2020", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26393,8 +26393,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2024", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2024", + "Description": "original 256 kHz audio recordings year 2019", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2019", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26425,8 +26425,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2025", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2025", + "Description": "original 256 kHz audio recordings year 2018", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2018", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26457,8 +26457,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "machine learning models", - "ARN": "arn:aws:s3:::pacific-sound-models", + "Description": "original 256 kHz audio recordings year 2017", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2017", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26489,8 +26489,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2021", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2021", + "Description": "original 256 kHz audio recordings year 2016", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2016", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26521,8 +26521,8 @@ }, { "Name": "Pacific Ocean Sound Recordings", - "Description": "original 256 kHz audio recordings year 2015", - "ARN": "arn:aws:s3:::pacific-sound-256khz-2015", + "Description": "original 256 kHz audio recordings year 2024", + "ARN": "arn:aws:s3:::pacific-sound-256khz-2024", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://docs.mbari.org/pacific-sound/", @@ -26574,8 +26574,8 @@ }, { "Name": "Pancreatic Cancer Organoid Profiling", - "Description": "RNA-Seq Gene Expression Quantification", - "ARN": "arn:aws:s3:::gdc-organoid-pancreatic-phs001611-2-open", + "Description": "WGS/WXS/RNA-Seq Aligned Reads, WXS Annotated Somatic Mutation, WXS Raw Somatic Mutation,RNA-Seq Splice Junction Quantification", + "ARN": "arn:aws:s3:::gdc-organoid-pancreatic-phs001611-2-controlled", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/study.cgi?study_id=phs001611.v1.p1", @@ -26595,14 +26595,14 @@ ], "Explore": null, "RequesterPays": null, - "ControlledAccess": null, + "ControlledAccess": "https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/study.cgi?study_id=phs001611.v1.p1", "AccountRequired": null, "Host": null }, { "Name": "Pancreatic Cancer Organoid Profiling", - "Description": "WGS/WXS/RNA-Seq Aligned Reads, WXS Annotated Somatic Mutation, WXS Raw Somatic Mutation,RNA-Seq Splice Junction Quantification", - "ARN": "arn:aws:s3:::gdc-organoid-pancreatic-phs001611-2-controlled", + "Description": "RNA-Seq Gene Expression Quantification", + "ARN": "arn:aws:s3:::gdc-organoid-pancreatic-phs001611-2-open", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/study.cgi?study_id=phs001611.v1.p1", @@ -26622,7 +26622,7 @@ ], "Explore": null, "RequesterPays": null, - "ControlledAccess": "https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/study.cgi?study_id=phs001611.v1.p1", + "ControlledAccess": null, "AccountRequired": null, "Host": null }, @@ -26772,8 +26772,8 @@ }, { "Name": "PoroTomo", - "Description": "PoroTomo Nodal Seismometer Field Notes and Metadata", - "ARN": "arn:aws:s3:::nrel-pds-porotomo/Nodal/nodal_metadata/", + "Description": "PoroTomo Datasets", + "ARN": "arn:aws:s3:::nrel-pds-porotomo/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md", @@ -26789,7 +26789,7 @@ "geospatial" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=Nodal%2Fnodal_metadata%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo)" ], "RequesterPays": null, "ControlledAccess": null, @@ -26798,8 +26798,8 @@ }, { "Name": "PoroTomo", - "Description": "PoroTomo Vertical Distributed Acoustic Sensing (DASV) Data in SEG-Y format", - "ARN": "arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASV/", + "Description": "PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data in SEG-Y format", + "ARN": "arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASH/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md", @@ -26815,7 +26815,7 @@ "geospatial" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASV%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASH%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -26824,8 +26824,8 @@ }, { "Name": "PoroTomo", - "Description": "PoroTomo Datasets", - "ARN": "arn:aws:s3:::nrel-pds-porotomo/", + "Description": "PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data Resampled in Time MATLAB Files", + "ARN": "arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASH/Resampled/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md", @@ -26841,7 +26841,7 @@ "geospatial" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASH%2FResampled%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -26850,8 +26850,8 @@ }, { "Name": "PoroTomo", - "Description": "PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data in HDF5 format", - "ARN": "arn:aws:s3:::nrel-pds-porotomo/DAS/H5/DASH/", + "Description": "PoroTomo Vertical Distributed Acoustic Sensing (DASV) Data in SEG-Y format", + "ARN": "arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASV/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md", @@ -26867,7 +26867,7 @@ "geospatial" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FH5%2FDASH%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASV%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -26876,8 +26876,8 @@ }, { "Name": "PoroTomo", - "Description": "PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data Resampled in Time MATLAB Files", - "ARN": "arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASH/Resampled/", + "Description": "PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data in HDF5 format", + "ARN": "arn:aws:s3:::nrel-pds-porotomo/DAS/H5/DASH/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md", @@ -26893,7 +26893,7 @@ "geospatial" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASH%2FResampled%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FH5%2FDASH%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -26954,8 +26954,8 @@ }, { "Name": "PoroTomo", - "Description": "PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data in SEG-Y format", - "ARN": "arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASH/", + "Description": "PoroTomo Nodal Seismometer Continuous Data", + "ARN": "arn:aws:s3:::nrel-pds-porotomo/Nodal/nodal_sac/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md", @@ -26971,7 +26971,7 @@ "geospatial" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASH%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=Nodal%2Fnodal_sac%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -26980,8 +26980,8 @@ }, { "Name": "PoroTomo", - "Description": "PoroTomo Nodal Seismometer Continuous Data", - "ARN": "arn:aws:s3:::nrel-pds-porotomo/Nodal/nodal_sac/", + "Description": "PoroTomo Nodal Seismometer Field Notes and Metadata", + "ARN": "arn:aws:s3:::nrel-pds-porotomo/Nodal/nodal_metadata/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md", @@ -26997,7 +26997,7 @@ "geospatial" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=Nodal%2Fnodal_sac%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=Nodal%2Fnodal_metadata%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -27134,10 +27134,10 @@ }, { "Name": "Protein Data Bank 3D Structural Biology Data", - "Description": "Historical snapshots of archival datasets from 2005 onwards Snapshots are generated annually and at major milestone", - "ARN": "arn:aws:s3:::pdbsnapshots", + "Description": "Globally cached distribution of the dataset Web frontend also available to browse the dataset and file directory", + "ARN": null, "Region": "us-west-2", - "Type": "S3 Bucket", + "Type": "CloudFront Distribution", "Documentation": "https://www.wwpdb.org/documentation/file-format", "Contact": "https://www.wwpdb.org/about/contact", "ManagedBy": "[Worldwide Protein Data Bank Partnership](wwpdb.org)", @@ -27166,7 +27166,7 @@ "x-ray crystallography" ], "Explore": [ - "[Browse Bucket](https://pdbsnapshots.s3.us-west-2.amazonaws.com/index.html)" + "[Browse Dataset](https://s3.rcsb.org)" ], "RequesterPays": null, "ControlledAccess": null, @@ -27175,10 +27175,10 @@ }, { "Name": "Protein Data Bank 3D Structural Biology Data", - "Description": "Globally cached distribution of the dataset Web frontend also available to browse the dataset and file directory", - "ARN": null, + "Description": "Historical snapshots of archival datasets from 2005 onwards Snapshots are generated annually and at major milestone", + "ARN": "arn:aws:s3:::pdbsnapshots", "Region": "us-west-2", - "Type": "CloudFront Distribution", + "Type": "S3 Bucket", "Documentation": "https://www.wwpdb.org/documentation/file-format", "Contact": "https://www.wwpdb.org/about/contact", "ManagedBy": "[Worldwide Protein Data Bank Partnership](wwpdb.org)", @@ -27207,7 +27207,7 @@ "x-ray crystallography" ], "Explore": [ - "[Browse Dataset](https://s3.rcsb.org)" + "[Browse Bucket](https://pdbsnapshots.s3.us-west-2.amazonaws.com/index.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -27238,8 +27238,8 @@ }, { "Name": "PubSeq - Public Sequence Resource", - "Description": "Pubseq output data (Arvados Keep)", - "ARN": "arn:aws:s3:::pubseq-output-data", + "Description": "PubSeq submitted datasets (FASTA and JSON metadata)", + "ARN": "arn:aws:s3:::pubseq-datasets", "Region": "us-east-2", "Type": "S3 Bucket", "Documentation": "https://covid19.genenetwork.org/about", @@ -27273,7 +27273,7 @@ "SPARQL" ], "Explore": [ - "[Arvados download](https://covid19.genenetwork.org/download)" + "[Browse Bucket](https://pubseq-datasets.s3.amazonaws.com/)" ], "RequesterPays": null, "ControlledAccess": null, @@ -27282,8 +27282,8 @@ }, { "Name": "PubSeq - Public Sequence Resource", - "Description": "PubSeq submitted datasets (FASTA and JSON metadata)", - "ARN": "arn:aws:s3:::pubseq-datasets", + "Description": "Pubseq output data (Arvados Keep)", + "ARN": "arn:aws:s3:::pubseq-output-data", "Region": "us-east-2", "Type": "S3 Bucket", "Documentation": "https://covid19.genenetwork.org/about", @@ -27317,7 +27317,7 @@ "SPARQL" ], "Explore": [ - "[Browse Bucket](https://pubseq-datasets.s3.amazonaws.com/)" + "[Arvados download](https://covid19.genenetwork.org/download)" ], "RequesterPays": null, "ControlledAccess": null, @@ -27356,8 +27356,8 @@ }, { "Name": "PyEnvs and CallArgs", - "Description": "CallArgs", - "ARN": "arn:aws:s3:::pyenvs-and-callargs/callargs/", + "Description": "PyEnvs", + "ARN": "arn:aws:s3:::pyenvs-and-callargs/pyenvs/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/amazon-research/function-call-argument-completion", @@ -27377,8 +27377,8 @@ }, { "Name": "PyEnvs and CallArgs", - "Description": "PyEnvs", - "ARN": "arn:aws:s3:::pyenvs-and-callargs/pyenvs/", + "Description": "CallArgs", + "ARN": "arn:aws:s3:::pyenvs-and-callargs/callargs/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/amazon-research/function-call-argument-completion", @@ -28037,8 +28037,8 @@ }, { "Name": "SILAM Air Quality", - "Description": "Surface Zarr files", - "ARN": "arn:aws:s3:::fmi-opendata-silam-surface-zarr", + "Description": "Surface NetCDF files", + "ARN": "arn:aws:s3:::fmi-opendata-silam-surface-netcdf", "Region": "eu-west-1", "Type": "S3 Bucket", "Documentation": "http://en.ilmatieteenlaitos.fi/open-data-on-aws-s3", @@ -28055,7 +28055,7 @@ "meteorological" ], "Explore": [ - "[Browse Bucket](https://fmi-opendata-silam-surface-zarr.s3.amazonaws.com/index.html)" + "[Browse Bucket](https://fmi-opendata-silam-surface-netcdf.s3.amazonaws.com/index.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -28064,10 +28064,10 @@ }, { "Name": "SILAM Air Quality", - "Description": "Notifications for new zarr surface data", - "ARN": "arn:aws:sns:eu-west-1:916174725480:new-fmi-opendata-silam-surface-zarr", + "Description": "Surface Zarr files", + "ARN": "arn:aws:s3:::fmi-opendata-silam-surface-zarr", "Region": "eu-west-1", - "Type": "SNS Topic", + "Type": "S3 Bucket", "Documentation": "http://en.ilmatieteenlaitos.fi/open-data-on-aws-s3", "Contact": "avoin-data@fmi.fi", "ManagedBy": "[Finnish Meteorological Institute](https://www.ilmatieteenlaitos.fi/)", @@ -28081,7 +28081,9 @@ "air quality", "meteorological" ], - "Explore": null, + "Explore": [ + "[Browse Bucket](https://fmi-opendata-silam-surface-zarr.s3.amazonaws.com/index.html)" + ], "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, @@ -28114,10 +28116,10 @@ }, { "Name": "SILAM Air Quality", - "Description": "Surface NetCDF files", - "ARN": "arn:aws:s3:::fmi-opendata-silam-surface-netcdf", + "Description": "Notifications for new zarr surface data", + "ARN": "arn:aws:sns:eu-west-1:916174725480:new-fmi-opendata-silam-surface-zarr", "Region": "eu-west-1", - "Type": "S3 Bucket", + "Type": "SNS Topic", "Documentation": "http://en.ilmatieteenlaitos.fi/open-data-on-aws-s3", "Contact": "avoin-data@fmi.fi", "ManagedBy": "[Finnish Meteorological Institute](https://www.ilmatieteenlaitos.fi/)", @@ -28131,9 +28133,7 @@ "air quality", "meteorological" ], - "Explore": [ - "[Browse Bucket](https://fmi-opendata-silam-surface-netcdf.s3.amazonaws.com/index.html)" - ], + "Explore": null, "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, @@ -28413,6 +28413,36 @@ "AccountRequired": null, "Host": null }, + { + "Name": "Satellogic EarthView dataset", + "Description": "Satellogic data includes TOA RGBN COG, VISUAL RGB COG files data and metadata", + "ARN": "arn:aws:s3:::satellogic-earthview", + "Region": "us-west-2", + "Type": "S3 Bucket", + "Documentation": "https://satellogic-earthview.s3.us-west-2.amazonaws.com/index.html", + "Contact": "https://www.satellogic.com/", + "ManagedBy": "[Satellogic](https://www.satellogic.com)", + "UpdateFrequency": "New data will be made available periodically, with annual updates expected in the future covering the same or other new regions.", + "License": "[CC BY 4.0](https://creativecommons.org/licenses/by/4.0/deed.en)", + "Tags": [ + "aws-pds", + "satellite imagery", + "earth observation", + "image processing", + "geospatial", + "computer vision", + "stac", + "cog" + ], + "Explore": [ + "[STAC Catalog](https://satellogic-earthview.s3.us-west-2.amazonaws.com/stac/catalog.json)", + "[STAC Browser](https://radiantearth.github.io/stac-browser/#/external/satellogic-earthview.s3.us-west-2.amazonaws.com/stac/catalog.json)" + ], + "RequesterPays": false, + "ControlledAccess": null, + "AccountRequired": null, + "Host": null + }, { "Name": "Scottish Public Sector LiDAR Dataset", "Description": "LiDAR data (DSM, DTM and Laz)", @@ -28492,8 +28522,8 @@ }, { "Name": "Seattle Alzheimer's Disease Brain Cell Atlas (SEA-AD)", - "Description": "Spatial transcriptomics data files in a public bucket", - "ARN": "arn:aws:s3:::sea-ad-spatial-transcriptomics", + "Description": "Quantitative neuropathology (full resolution images, processed images, and quantifications) in a public bucket", + "ARN": "arn:aws:s3:::sea-ad-quantitative-neuropathology", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://portal.brain-map.org/explore/seattle-alzheimers-disease/seattle-alzheimers-disease-brain-cell-atlas-download?edit&language=en", @@ -28520,7 +28550,7 @@ "life sciences" ], "Explore": [ - "[Browse Bucket](https://sea-ad-spatial-transcriptomics.s3.amazonaws.com/index.html)" + "[Browse Bucket](https://sea-ad-quantitative-neuropathology.s3.amazonaws.com/index.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -28529,8 +28559,8 @@ }, { "Name": "Seattle Alzheimer's Disease Brain Cell Atlas (SEA-AD)", - "Description": "Quantitative neuropathology (full resolution images, processed images, and quantifications) in a public bucket", - "ARN": "arn:aws:s3:::sea-ad-quantitative-neuropathology", + "Description": "Single cell profiling (transcriptomics and epigenomics) data files in a public bucket", + "ARN": "arn:aws:s3:::sea-ad-single-cell-profiling", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://portal.brain-map.org/explore/seattle-alzheimers-disease/seattle-alzheimers-disease-brain-cell-atlas-download?edit&language=en", @@ -28557,7 +28587,7 @@ "life sciences" ], "Explore": [ - "[Browse Bucket](https://sea-ad-quantitative-neuropathology.s3.amazonaws.com/index.html)" + "[Browse Bucket](https://sea-ad-single-cell-profiling.s3.amazonaws.com/index.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -28566,8 +28596,8 @@ }, { "Name": "Seattle Alzheimer's Disease Brain Cell Atlas (SEA-AD)", - "Description": "Single cell profiling (transcriptomics and epigenomics) data files in a public bucket", - "ARN": "arn:aws:s3:::sea-ad-single-cell-profiling", + "Description": "Spatial transcriptomics data files in a public bucket", + "ARN": "arn:aws:s3:::sea-ad-spatial-transcriptomics", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://portal.brain-map.org/explore/seattle-alzheimers-disease/seattle-alzheimers-disease-brain-cell-atlas-download?edit&language=en", @@ -28594,7 +28624,7 @@ "life sciences" ], "Explore": [ - "[Browse Bucket](https://sea-ad-single-cell-profiling.s3.amazonaws.com/index.html)" + "[Browse Bucket](https://sea-ad-spatial-transcriptomics.s3.amazonaws.com/index.html)" ], "RequesterPays": null, "ControlledAccess": null, @@ -28857,10 +28887,10 @@ }, { "Name": "Sentinel-2", - "Description": "New scene notifications for L2A, can subscribe with Lambda", - "ARN": "arn:aws:sns:eu-central-1:214830741341:SentinelS2L2A", + "Description": "S3 Inventory files for L1C and CSV", + "ARN": "arn:aws:s3:::sentinel-inventory/sentinel-s2-l1c", "Region": "eu-central-1", - "Type": "SNS Topic", + "Type": "S3 Bucket", "Documentation": "Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/sentinel-s2-l1c/readme.html) and [Sentinel-2 L2A](https://roda.sentinel-hub.com/sentinel-s2-l2a/readme.html).", "Contact": "https://forum.sentinel-hub.com/c/aws-sentinel", "ManagedBy": "[Sinergise](https://www.sinergise.com/)", @@ -28911,8 +28941,8 @@ }, { "Name": "Sentinel-2", - "Description": "Zipped archives for each L2A product with 3 day retention period, in Requester Pays bucket", - "ARN": "arn:aws:s3:::sentinel-s2-l2a-zips", + "Description": "S3 Inventory files for L2A and CSV", + "ARN": "arn:aws:s3:::sentinel-inventory/sentinel-s2-l2a", "Region": "eu-central-1", "Type": "S3 Bucket", "Documentation": "Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/sentinel-s2-l1c/readme.html) and [Sentinel-2 L2A](https://roda.sentinel-hub.com/sentinel-s2-l2a/readme.html).", @@ -28931,7 +28961,7 @@ "stac" ], "Explore": null, - "RequesterPays": true, + "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, "Host": null @@ -28965,8 +28995,8 @@ }, { "Name": "Sentinel-2", - "Description": "S3 Inventory files for L2A and CSV", - "ARN": "arn:aws:s3:::sentinel-inventory/sentinel-s2-l2a", + "Description": "Zipped archives for each L2A product with 3 day retention period, in Requester Pays bucket", + "ARN": "arn:aws:s3:::sentinel-s2-l2a-zips", "Region": "eu-central-1", "Type": "S3 Bucket", "Documentation": "Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/sentinel-s2-l1c/readme.html) and [Sentinel-2 L2A](https://roda.sentinel-hub.com/sentinel-s2-l2a/readme.html).", @@ -28985,7 +29015,7 @@ "stac" ], "Explore": null, - "RequesterPays": null, + "RequesterPays": true, "ControlledAccess": null, "AccountRequired": null, "Host": null @@ -29021,8 +29051,8 @@ }, { "Name": "Sentinel-2", - "Description": "S3 Inventory files for L1C and CSV", - "ARN": "arn:aws:s3:::sentinel-inventory/sentinel-s2-l1c", + "Description": "Level 1C scenes and metadata, in Requester Pays S3 bucket", + "ARN": "arn:aws:s3:::sentinel-s2-l1c", "Region": "eu-central-1", "Type": "S3 Bucket", "Documentation": "Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/sentinel-s2-l1c/readme.html) and [Sentinel-2 L2A](https://roda.sentinel-hub.com/sentinel-s2-l2a/readme.html).", @@ -29040,18 +29070,23 @@ "disaster response", "stac" ], - "Explore": null, - "RequesterPays": null, + "Explore": [ + "[Earth Search STAC L1C Collection](https://earth-search.aws.element84.com/v1/collections/sentinel-2-l1c)", + "[Earth Search STAC Browser L1C Collection](https://radiantearth.github.io/stac-browser/#/external/earth-search.aws.element84.com/v1/collections/sentinel-2-l1c)", + "[STAC V1.0.0 endpoint](https://sentinel-s2-l1c-stac.s3.amazonaws.com/)", + "[Earth Viewer by Element 84](https://viewer.aws.element84.com/)" + ], + "RequesterPays": true, "ControlledAccess": null, "AccountRequired": null, "Host": null }, { "Name": "Sentinel-2", - "Description": "Level 1C scenes and metadata, in Requester Pays S3 bucket", - "ARN": "arn:aws:s3:::sentinel-s2-l1c", + "Description": "New scene notifications for L2A, can subscribe with Lambda", + "ARN": "arn:aws:sns:eu-central-1:214830741341:SentinelS2L2A", "Region": "eu-central-1", - "Type": "S3 Bucket", + "Type": "SNS Topic", "Documentation": "Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/sentinel-s2-l1c/readme.html) and [Sentinel-2 L2A](https://roda.sentinel-hub.com/sentinel-s2-l2a/readme.html).", "Contact": "https://forum.sentinel-hub.com/c/aws-sentinel", "ManagedBy": "[Sinergise](https://www.sinergise.com/)", @@ -29067,13 +29102,8 @@ "disaster response", "stac" ], - "Explore": [ - "[Earth Search STAC L1C Collection](https://earth-search.aws.element84.com/v1/collections/sentinel-2-l1c)", - "[Earth Search STAC Browser L1C Collection](https://radiantearth.github.io/stac-browser/#/external/earth-search.aws.element84.com/v1/collections/sentinel-2-l1c)", - "[STAC V1.0.0 endpoint](https://sentinel-s2-l1c-stac.s3.amazonaws.com/)", - "[Earth Viewer by Element 84](https://viewer.aws.element84.com/)" - ], - "RequesterPays": true, + "Explore": null, + "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, "Host": null @@ -29160,8 +29190,8 @@ }, { "Name": "Sentinel-2 Cloud-Optimized GeoTIFFs", - "Description": "S3 Inventory files for L1C and CSV", - "ARN": "arn:aws:s3:::sentinel-cogs-inventory", + "Description": "Level 2A scenes and metadata", + "ARN": "arn:aws:s3:::sentinel-cogs", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/cirrus-geo/cirrus-earth-search", @@ -29180,16 +29210,19 @@ "cog", "stac" ], - "Explore": null, - "RequesterPays": null, + "Explore": [ + "[Earth Search STAC L2A Collection](https://earth-search.aws.element84.com/v1/collections/sentinel-2-l2a)", + "[STAC Browser L2A Collection](https://radiantearth.github.io/stac-browser/#/external/earth-search.aws.element84.com/v1/collections/sentinel-2-l2a)" + ], + "RequesterPays": false, "ControlledAccess": null, "AccountRequired": null, "Host": null }, { "Name": "Sentinel-2 Cloud-Optimized GeoTIFFs", - "Description": "Level 2A scenes and metadata", - "ARN": "arn:aws:s3:::sentinel-cogs", + "Description": "S3 Inventory files for L1C and CSV", + "ARN": "arn:aws:s3:::sentinel-cogs-inventory", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/cirrus-geo/cirrus-earth-search", @@ -29208,11 +29241,8 @@ "cog", "stac" ], - "Explore": [ - "[Earth Search STAC L2A Collection](https://earth-search.aws.element84.com/v1/collections/sentinel-2-l2a)", - "[STAC Browser L2A Collection](https://radiantearth.github.io/stac-browser/#/external/earth-search.aws.element84.com/v1/collections/sentinel-2-l2a)" - ], - "RequesterPays": false, + "Explore": null, + "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, "Host": null @@ -29246,8 +29276,8 @@ }, { "Name": "Sentinel-3", - "Description": "Sentinel-3 Near Real Time Data (NRT) format", - "ARN": "arn:aws:s3:::meeo-s3/NRT/", + "Description": "Sentinel-3 Short Time Critical (STC) format", + "ARN": "arn:aws:s3:::meeo-s3/STC/", "Region": "eu-central-1", "Type": "S3 Bucket", "Documentation": "https://github.com/Sentinel-5P/data-on-s3/blob/master/DocsForAws/Sentinel3Description.md", @@ -29302,8 +29332,8 @@ }, { "Name": "Sentinel-3", - "Description": "Sentinel-3 Short Time Critical (STC) format", - "ARN": "arn:aws:s3:::meeo-s3/STC/", + "Description": "Sentinel-3 Near Real Time Data (NRT) format", + "ARN": "arn:aws:s3:::meeo-s3/NRT/", "Region": "eu-central-1", "Type": "S3 Bucket", "Documentation": "https://github.com/Sentinel-5P/data-on-s3/blob/master/DocsForAws/Sentinel3Description.md", @@ -29763,8 +29793,8 @@ }, { "Name": "Software Heritage Graph Dataset", - "Description": "S3 Inventory files", - "ARN": "arn:aws:s3:::softwareheritage-inventory", + "Description": "Software Heritage Graph Dataset", + "ARN": "arn:aws:s3:::softwareheritage", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://docs.softwareheritage.org/devel/swh-dataset/graph/athena.html", @@ -29787,8 +29817,8 @@ }, { "Name": "Software Heritage Graph Dataset", - "Description": "Software Heritage Graph Dataset", - "ARN": "arn:aws:s3:::softwareheritage", + "Description": "S3 Inventory files", + "ARN": "arn:aws:s3:::softwareheritage-inventory", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://docs.softwareheritage.org/devel/swh-dataset/graph/athena.html", @@ -30138,8 +30168,8 @@ }, { "Name": "Sup3rCC", - "Description": "Sup3rCC Generative Models", - "ARN": "arn:aws:s3:::nrel-pds-sup3rcc/models/", + "Description": "Sup3rCC - CONUS - MRI ESM 20 - SSP585 - r1i1p1f1", + "ARN": "arn:aws:s3:::nrel-pds-sup3rcc/conus_mriesm20_ssp585_r1i1p1f1/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/NREL/sup3r", @@ -30155,7 +30185,7 @@ "climate model" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-sup3rcc&prefix=models%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-sup3rcc&prefix=conus_mriesm20_ssp585_r1i1p1f1%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -30164,8 +30194,8 @@ }, { "Name": "Sup3rCC", - "Description": "Sup3rCC - CONUS - MRI ESM 20 - SSP585 - r1i1p1f1", - "ARN": "arn:aws:s3:::nrel-pds-sup3rcc/conus_mriesm20_ssp585_r1i1p1f1/", + "Description": "Sup3rCC Generative Models", + "ARN": "arn:aws:s3:::nrel-pds-sup3rcc/models/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/NREL/sup3r", @@ -30181,7 +30211,7 @@ "climate model" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-sup3rcc&prefix=conus_mriesm20_ssp585_r1i1p1f1%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-sup3rcc&prefix=models%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -30899,10 +30929,10 @@ }, { "Name": "Transiting Exoplanet Survey Satellite (TESS)", - "Description": "TESS Mission data files", - "ARN": "arn:aws:s3:::stpubdata/tess", + "Description": "Notifications for new data", + "ARN": "arn:aws:sns:us-east-1:879230861493:stpubdata/tess", "Region": "us-east-1", - "Type": "S3 Bucket", + "Type": "SNS Topic", "Documentation": "https://archive.stsci.edu/missions-and-data/tess", "Contact": "archive@stsci.edu", "ManagedBy": "[Space Telescope Science Institute](http://www.stsci.edu/)", @@ -30913,17 +30943,17 @@ "aws-pds" ], "Explore": null, - "RequesterPays": false, + "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, "Host": null }, { "Name": "Transiting Exoplanet Survey Satellite (TESS)", - "Description": "Notifications for new data", - "ARN": "arn:aws:sns:us-east-1:879230861493:stpubdata/tess", + "Description": "TESS Mission data files", + "ARN": "arn:aws:s3:::stpubdata/tess", "Region": "us-east-1", - "Type": "SNS Topic", + "Type": "S3 Bucket", "Documentation": "https://archive.stsci.edu/missions-and-data/tess", "Contact": "archive@stsci.edu", "ManagedBy": "[Space Telescope Science Institute](http://www.stsci.edu/)", @@ -30934,7 +30964,7 @@ "aws-pds" ], "Explore": null, - "RequesterPays": null, + "RequesterPays": false, "ControlledAccess": null, "AccountRequired": null, "Host": null @@ -31362,8 +31392,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2024_02", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2024-02/", + "Description": "UniProt 2021_03", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2021-03/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31392,8 +31422,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2024_03", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2024-03/", + "Description": "UniProt 2021_01", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2021-01/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31422,8 +31452,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2024_05", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2024-05/", + "Description": "UniProt 2021_02", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2021-02/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31452,8 +31482,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2021_01", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2021-01/", + "Description": "UniProt 2021_04", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2021-04/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31482,8 +31512,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2021_02", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2021-02/", + "Description": "UniProt 2022_02", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2022-02/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31512,8 +31542,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2021_03", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2021-03/", + "Description": "UniProt 2022_03", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2022-03/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31542,8 +31572,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2021_04", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2021-04/", + "Description": "UniProt 2022_01", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2022-01/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31572,8 +31602,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2022_01", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2022-01/", + "Description": "UniProt 2022_05", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2022-05/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31602,8 +31632,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2022_03", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2022-03/", + "Description": "UniProt 2024_05", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2024-05/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31632,8 +31662,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2023_05", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2023-05/", + "Description": "UniProt 2024_03", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2024-03/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31662,8 +31692,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2022_04", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2022-04/", + "Description": "UniProt 2024_02", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2024-02/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31692,8 +31722,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2022_05", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2022-05/", + "Description": "UniProt 2022_04", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2022-04/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31722,8 +31752,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2023_01", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2023-01/", + "Description": "UniProt 2023_05", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2023-05/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31752,8 +31782,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2023_02", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2023-02/", + "Description": "UniProt 2024_01", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2024-01/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31812,8 +31842,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2023_04", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2023-04/", + "Description": "UniProt 2023_02", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2023-02/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31842,8 +31872,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2022_02", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2022-02/", + "Description": "UniProt 2023_01", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2023-01/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -31872,8 +31902,8 @@ }, { "Name": "UniProt", - "Description": "UniProt 2024_01", - "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2024-01/", + "Description": "UniProt 2023_04", + "ARN": "arn:aws:s3:::aws-open-data-uniprot-rdf/2023-04/", "Region": "eu-west-3", "Type": "S3 Bucket", "Documentation": "https://www.uniprot.org/help/about", @@ -32022,8 +32052,8 @@ }, { "Name": "Vermont Open Geospatial on AWS", - "Description": "Imagery datsets are organized in this bucket as statewide file mosaics and by acquisition year (often a portion of the state in any given year) These data are available in Cloud Optimized GeoTIFF (COG) format and use the following naming convention; 1) Statewide - STATEWIDE__cm__<#BANDS>Band, 2) By Acquisition Year - _cm__<#BANDS>Band Individual tiles are also available as lossless COGs under the /_Tiles subfolder", - "ARN": "arn:aws:s3:::vtopendata-prd/Imagery", + "Description": "Landcover datsets are organized in this bucket as statewide file mosaics These data are available in Cloud Optimized GeoTIFF (COG) format and use the following naming convention STATEWIDE__cm_LANDCOVER_", + "ARN": "arn:aws:s3:::vtopendata-prd/Landcover", "Region": "us-east-2", "Type": "S3 Bucket", "Documentation": "https://vcgi.vermont.gov/data-and-programs/", @@ -32047,8 +32077,8 @@ }, { "Name": "Vermont Open Geospatial on AWS", - "Description": "Landcover datsets are organized in this bucket as statewide file mosaics These data are available in Cloud Optimized GeoTIFF (COG) format and use the following naming convention STATEWIDE__cm_LANDCOVER_", - "ARN": "arn:aws:s3:::vtopendata-prd/Landcover", + "Description": "Imagery datsets are organized in this bucket as statewide file mosaics and by acquisition year (often a portion of the state in any given year) These data are available in Cloud Optimized GeoTIFF (COG) format and use the following naming convention; 1) Statewide - STATEWIDE__cm__<#BANDS>Band, 2) By Acquisition Year - _cm__<#BANDS>Band Individual tiles are also available as lossless COGs under the /_Tiles subfolder", + "ARN": "arn:aws:s3:::vtopendata-prd/Imagery", "Region": "us-east-2", "Type": "S3 Bucket", "Documentation": "https://vcgi.vermont.gov/data-and-programs/", @@ -32410,8 +32440,8 @@ }, { "Name": "Wind AI Bench", - "Description": "Wind AI Bench Airfoil Computational Fluid Dynamics (CFD) - 9k Shapes Data Sets", - "ARN": "arn:aws:s3:::nrel-pds-windai/aerodynamic_shapes/2D/9K_airfoils/", + "Description": "Wind AI Bench Airfoil Computational Fluid Dynamics (CFD) - 2k Shapes Data Sets", + "ARN": "arn:aws:s3:::nrel-pds-windai/aerodynamic_shapes/2D/2K_airfoils/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/NREL/windAI_bench", @@ -32426,7 +32456,7 @@ "machine learning" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-windai&prefix=aerodynamic_shapes%2F2D%2F9k_airfoils%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-windai&prefix=aerodynamic_shapes%2F2D%2F2k_airfoils%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -32435,8 +32465,8 @@ }, { "Name": "Wind AI Bench", - "Description": "Wind AI Bench Airfoil Computational Fluid Dynamics (CFD) - 2k Shapes Data Sets", - "ARN": "arn:aws:s3:::nrel-pds-windai/aerodynamic_shapes/2D/2K_airfoils/", + "Description": "Wind AI Bench Airfoil Computational Fluid Dynamics (CFD) - 9k Shapes Data Sets", + "ARN": "arn:aws:s3:::nrel-pds-windai/aerodynamic_shapes/2D/9K_airfoils/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/NREL/windAI_bench", @@ -32451,7 +32481,7 @@ "machine learning" ], "Explore": [ - "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-windai&prefix=aerodynamic_shapes%2F2D%2F2k_airfoils%2F)" + "[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-windai&prefix=aerodynamic_shapes%2F2D%2F9k_airfoils%2F)" ], "RequesterPays": null, "ControlledAccess": null, @@ -32590,8 +32620,8 @@ }, { "Name": "YouTube 8 Million - Data Lakehouse Ready", - "Description": "Original YT8M *tfrecords File structure info can be found here", - "ARN": "arn:aws:s3:::aws-roda-ml-datalake/yt8m/", + "Description": "Lakehouse ready YT8M as Glue Parquet files Install instructions here", + "ARN": "arn:aws:s3:::aws-roda-ml-datalake/yt8m_ods/", "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_install.md", @@ -32615,9 +32645,9 @@ }, { "Name": "YouTube 8 Million - Data Lakehouse Ready", - "Description": "Lakehouse ready YT8M as Glue Parquet files Install instructions here", - "ARN": "arn:aws:s3:::aws-roda-ml-datalake/yt8m_ods/", - "Region": "us-west-2", + "Description": "Replica of the two locations above in us-east-1", + "ARN": "arn:aws:s3:::aws-roda-ml-datalake-us-east-1/", + "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_install.md", "Contact": "https://github.com/aws-samples/data-lake-as-code/issues", @@ -32640,9 +32670,9 @@ }, { "Name": "YouTube 8 Million - Data Lakehouse Ready", - "Description": "Replica of the two locations above in us-east-1", - "ARN": "arn:aws:s3:::aws-roda-ml-datalake-us-east-1/", - "Region": "us-east-1", + "Description": "Original YT8M *tfrecords File structure info can be found here", + "ARN": "arn:aws:s3:::aws-roda-ml-datalake/yt8m/", + "Region": "us-west-2", "Type": "S3 Bucket", "Documentation": "https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_install.md", "Contact": "https://github.com/aws-samples/data-lake-as-code/issues", @@ -32740,8 +32770,8 @@ }, { "Name": "iHART Whole Genome Sequencing Data Set", - "Description": "Cram, gVCF, and VCF files from The iHART whole genome sequencing study, Phase I+II, GRCh38", - "ARN": "arn:aws:s3:::ihart-hg38", + "Description": "gVCF and VCF files from The iHART whole genome sequencing study, control data sets", + "ARN": "arn:aws:s3:::ihart-psp", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "http://www.ihart.org/data", @@ -32767,8 +32797,8 @@ }, { "Name": "iHART Whole Genome Sequencing Data Set", - "Description": "BAM, gVCF, and VCF files from The iHART whole genome sequencing study, Phase II", - "ARN": "arn:aws:s3:::ihart-main", + "Description": "Cram, gVCF, and VCF files from The iHART whole genome sequencing study, Phase I+II, GRCh38", + "ARN": "arn:aws:s3:::ihart-hg38", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "http://www.ihart.org/data", @@ -32794,8 +32824,8 @@ }, { "Name": "iHART Whole Genome Sequencing Data Set", - "Description": "BAM, gVCF, and VCF files from The iHART whole genome sequencing study, Phase I", - "ARN": "arn:aws:s3:::ihart-release", + "Description": "BAM, gVCF, and VCF files from The iHART whole genome sequencing study, Phase II", + "ARN": "arn:aws:s3:::ihart-main", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "http://www.ihart.org/data", @@ -32821,8 +32851,8 @@ }, { "Name": "iHART Whole Genome Sequencing Data Set", - "Description": "gVCF and VCF files from The iHART whole genome sequencing study, control data sets", - "ARN": "arn:aws:s3:::ihart-psp", + "Description": "BAM, gVCF, and VCF files from The iHART whole genome sequencing study, Phase I", + "ARN": "arn:aws:s3:::ihart-release", "Region": "us-east-1", "Type": "S3 Bucket", "Documentation": "http://www.ihart.org/data", @@ -32924,10 +32954,10 @@ }, { "Name": "nuPlan", - "Description": "nuPlan Dataset", - "ARN": "arn:aws:s3:::motional-nuplan", + "Description": "Globally cached distribution of the nuPlan Dataset Web frontend is available to browse the dataset", + "ARN": null, "Region": "ap-northeast-1", - "Type": "S3 Bucket", + "Type": "CloudFront Distribution", "Documentation": "https://nuplan.org", "Contact": "https://nuplan.org", "ManagedBy": "[Motional, Inc.](https://motional.com)", @@ -32941,20 +32971,18 @@ "transportation", "urban" ], - "Explore": [ - "[Browse Bucket](https://motional-nuplan.s3.ap-northeast-1.amazonaws.com/index.html)" - ], + "Explore": null, "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, - "Host": null + "Host": "https://d1qinkmu0ju04f.cloudfront.net" }, { "Name": "nuPlan", - "Description": "Globally cached distribution of the nuPlan Dataset Web frontend is available to browse the dataset", - "ARN": null, + "Description": "nuPlan Dataset", + "ARN": "arn:aws:s3:::motional-nuplan", "Region": "ap-northeast-1", - "Type": "CloudFront Distribution", + "Type": "S3 Bucket", "Documentation": "https://nuplan.org", "Contact": "https://nuplan.org", "ManagedBy": "[Motional, Inc.](https://motional.com)", @@ -32968,18 +32996,20 @@ "transportation", "urban" ], - "Explore": null, + "Explore": [ + "[Browse Bucket](https://motional-nuplan.s3.ap-northeast-1.amazonaws.com/index.html)" + ], "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, - "Host": "https://d1qinkmu0ju04f.cloudfront.net" + "Host": null }, { "Name": "nuScenes", - "Description": "nuScenes Dataset", - "ARN": "arn:aws:s3:::motional-nuscenes", + "Description": "Globally cached distribution of the nuScenes Dataset Web frontend is available to browse the dataset", + "ARN": null, "Region": "ap-northeast-1", - "Type": "S3 Bucket", + "Type": "CloudFront Distribution", "Documentation": "https://www.nuscenes.org", "Contact": "https://www.nuscenes.org", "ManagedBy": "[Motional, Inc.](https://motional.com)", @@ -32994,20 +33024,18 @@ "transportation", "urban" ], - "Explore": [ - "[Browse Bucket](https://motional-nuscenes.s3.ap-northeast-1.amazonaws.com/index.html)" - ], + "Explore": null, "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, - "Host": null + "Host": "https://d36yt3mvayqw5m.cloudfront.net" }, { "Name": "nuScenes", - "Description": "Globally cached distribution of the nuScenes Dataset Web frontend is available to browse the dataset", - "ARN": null, + "Description": "nuScenes Dataset", + "ARN": "arn:aws:s3:::motional-nuscenes", "Region": "ap-northeast-1", - "Type": "CloudFront Distribution", + "Type": "S3 Bucket", "Documentation": "https://www.nuscenes.org", "Contact": "https://www.nuscenes.org", "ManagedBy": "[Motional, Inc.](https://motional.com)", @@ -33022,18 +33050,20 @@ "transportation", "urban" ], - "Explore": null, + "Explore": [ + "[Browse Bucket](https://motional-nuscenes.s3.ap-northeast-1.amazonaws.com/index.html)" + ], "RequesterPays": null, "ControlledAccess": null, "AccountRequired": null, - "Host": "https://d36yt3mvayqw5m.cloudfront.net" + "Host": null }, { "Name": "real-changesets", - "Description": "New File Notification", - "ARN": "arn:aws:sns:us-west-2:877446169145:real-changesets-object_created", + "Description": "real-changesets", + "ARN": "arn:aws:s3:::real-changesets", "Region": "us-west-2", - "Type": "SNS Topic", + "Type": "S3 Bucket", "Documentation": "https://github.com/osmus/osmcha-charter-project/blob/main/real-changesets-docs.md", "Contact": "team@openstreetmap.us", "ManagedBy": "OpenStreetMap US", @@ -33054,10 +33084,10 @@ }, { "Name": "real-changesets", - "Description": "real-changesets", - "ARN": "arn:aws:s3:::real-changesets", + "Description": "New File Notification", + "ARN": "arn:aws:sns:us-west-2:877446169145:real-changesets-object_created", "Region": "us-west-2", - "Type": "S3 Bucket", + "Type": "SNS Topic", "Documentation": "https://github.com/osmus/osmcha-charter-project/blob/main/real-changesets-docs.md", "Contact": "team@openstreetmap.us", "ManagedBy": "OpenStreetMap US", diff --git a/aws_open_datasets.tsv b/aws_open_datasets.tsv index 834d5cf..dc376ca 100644 --- a/aws_open_datasets.tsv +++ b/aws_open_datasets.tsv @@ -619,9 +619,9 @@ NOAA Analysis of Record for Calibration (AORC) Dataset 1-km resolution AORC vers NOAA Atmospheric Climate Data Records Solar Spectral Irradiance arn:aws:s3:::noaa-cdr-solar-spectral-irradiance-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-solar-spectral-irradiance-pds.s3.amazonaws.com/index.html)'] NOAA Atmospheric Climate Data Records Total Solar Irradiance arn:aws:s3:::noaa-cdr-total-solar-irradiance-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-total-solar-irradiance-pds.s3.amazonaws.com/index.html)'] NOAA Atmospheric Climate Data Records PERSIANN Precip arn:aws:s3:::noaa-cdr-precip-persiann-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-precip-persiann-pds.s3.amazonaws.com/index.html)'] -NOAA Atmospheric Climate Data Records Cloud Properties Polar Orbiter arn:aws:s3:::noaa-cdr-cloud-properties-polar-orbiter-nasa-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-cloud-properties-polar-orbiter-nasa-pds.s3.amazonaws.com/index.html)'] -NOAA Atmospheric Climate Data Records GPCP Precip Monthly arn:aws:s3:::noaa-cdr-precip-gpcp-monthly-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-precip-gpcp-monthly-pds.s3.amazonaws.com/index.html)'] NOAA Atmospheric Climate Data Records Hydrological Properties arn:aws:s3:::noaa-cdr-hydrological-properties-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-hydrological-properties-pds.s3.amazonaws.com/index.html)'] +NOAA Atmospheric Climate Data Records GPCP Precip Monthly arn:aws:s3:::noaa-cdr-precip-gpcp-monthly-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-precip-gpcp-monthly-pds.s3.amazonaws.com/index.html)'] +NOAA Atmospheric Climate Data Records Cloud Properties Polar Orbiter arn:aws:s3:::noaa-cdr-cloud-properties-polar-orbiter-nasa-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-cloud-properties-polar-orbiter-nasa-pds.s3.amazonaws.com/index.html)'] NOAA Atmospheric Climate Data Records Ocean Heat Content arn:aws:s3:::noaa-cdr-ocean-heat-content-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-ocean-heat-content-pds.s3.amazonaws.com/index.html)'] NOAA Atmospheric Climate Data Records Ocean Heatflux arn:aws:s3:::noaa-cdr-ocean-heatflux-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-ocean-heatflux-pds.s3.amazonaws.com/index.html)'] NOAA Atmospheric Climate Data Records Ocean Nearsurface Atmos Profiles arn:aws:s3:::noaa-cdr-ocean-nearsurface-atmos-profiles-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/products/climate-data-records/atmospheric For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-ocean-nearsurface-atmos-profiles-pds.s3.amazonaws.com/index.html)'] @@ -663,8 +663,8 @@ NOAA Geostationary Operational Environmental Satellites (GOES) 16, 17 & 18 New d NOAA Geostationary Operational Environmental Satellites (GOES) 16, 17 & 18 GOES-16 imagery and metadata arn:aws:s3:::noaa-goes16 us-east-1 S3 Bucket https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-goes16 "For questions related to specific GOES Products, please visit the ""[GOES-R websi" [NOAA](http://www.noaa.gov/) New data is added as soon as it's available There are no restrictions on the use of this data. aws-pds, agriculture, geospatial, weather, earth observation, meteorological, disaster response, satellite imagery ['[Browse Bucket](https://noaa-goes16.s3.amazonaws.com/index.html)'] NOAA Geostationary Operational Environmental Satellites (GOES) 16, 17 & 18 New data notifications for GOES-18, only Lambda and SQS protocols allowed arn:aws:sns:us-east-1:123901341784:NewGOES18Object us-east-1 SNS Topic https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-goes16 "For questions related to specific GOES Products, please visit the ""[GOES-R websi" [NOAA](http://www.noaa.gov/) New data is added as soon as it's available There are no restrictions on the use of this data. aws-pds, agriculture, geospatial, weather, earth observation, meteorological, disaster response, satellite imagery NOAA Geostationary Operational Environmental Satellites (GOES) 16, 17 & 18 GOES-18 imagery and metadata arn:aws:s3:::noaa-goes18 us-east-1 S3 Bucket https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-goes16 "For questions related to specific GOES Products, please visit the ""[GOES-R websi" [NOAA](http://www.noaa.gov/) New data is added as soon as it's available There are no restrictions on the use of this data. aws-pds, agriculture, geospatial, weather, earth observation, meteorological, disaster response, satellite imagery ['[Browse Bucket](https://noaa-goes18.s3.amazonaws.com/index.html)'] -NOAA Global Data Assimilation (DA) Test Data Global Data Assimilation (DA) System Test Data arn:aws:s3:::noaa-ufs-gdas-pds us-east-1 S3 Bucket https://github.com/NOAA-EMC/GDASApp/wiki For questions regarding data content or quality, post on the ufs-community forum [NOAA](http://www.noaa.gov/) These are stable datasets for use with global DA projects. They will be updated GNU Lesser Public License v2.1: https://www.gnu.org/licenses/old-licenses/lgpl-2 aws-pds, agriculture, climate, disaster response, environmental, meteorological, weather ['[Browse Bucket](https://noaa-ufs-gdas-pds.s3.amazonaws.com/index.html)'] NOAA Global Data Assimilation (DA) Test Data New data notifications for Global Data Assimilation (DA) System Test Data, only arn:aws:sns:us-east-1:709902155096:NewNWSUFSGDASObject us-east-1 SNS Topic https://github.com/NOAA-EMC/GDASApp/wiki For questions regarding data content or quality, post on the ufs-community forum [NOAA](http://www.noaa.gov/) These are stable datasets for use with global DA projects. They will be updated GNU Lesser Public License v2.1: https://www.gnu.org/licenses/old-licenses/lgpl-2 aws-pds, agriculture, climate, disaster response, environmental, meteorological, weather +NOAA Global Data Assimilation (DA) Test Data Global Data Assimilation (DA) System Test Data arn:aws:s3:::noaa-ufs-gdas-pds us-east-1 S3 Bucket https://github.com/NOAA-EMC/GDASApp/wiki For questions regarding data content or quality, post on the ufs-community forum [NOAA](http://www.noaa.gov/) These are stable datasets for use with global DA projects. They will be updated GNU Lesser Public License v2.1: https://www.gnu.org/licenses/old-licenses/lgpl-2 aws-pds, agriculture, climate, disaster response, environmental, meteorological, weather ['[Browse Bucket](https://noaa-ufs-gdas-pds.s3.amazonaws.com/index.html)'] NOAA Global Ensemble Forecast System (GEFS) New data notifications for GFS, only Lambda and SQS protocols allowed arn:aws:sns:us-east-1:123901341784:NewGEFSObject us-east-1 SNS Topic https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-gefs-pds For questions regarding data content or quality, visit [the NOAA GEFS site](http [NOAA](http://www.noaa.gov/) 4 times a day, every 6 hours starting at midnight. Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather NOAA Global Ensemble Forecast System (GEFS) Project data files arn:aws:s3:::noaa-gefs-pds us-east-1 S3 Bucket https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-gefs-pds For questions regarding data content or quality, visit [the NOAA GEFS site](http [NOAA](http://www.noaa.gov/) 4 times a day, every 6 hours starting at midnight. Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather ['[Browse Bucket](https://noaa-gefs-pds.s3.amazonaws.com/index.html)'] NOAA Global Ensemble Forecast System (GEFS) Re-forecast GEFS Re-forecast in Grib2 Format arn:aws:s3:::noaa-gefs-retrospective us-east-1 S3 Bucket https://noaa-gefs-retrospective.s3.amazonaws.com/Description_of_reforecast_data. For any questions regarding data delivery or any general questions regarding the [NOAA](http://www.noaa.gov/) Re-forecasts do not adhere to an update frequency. Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather ['[Browse Bucket](https://noaa-gefs-retrospective.s3.amazonaws.com/index.html)'] @@ -712,11 +712,11 @@ NOAA National Blend of Models (NBM) National Blend of Models (NBM) Grib2 Format NOAA National Blend of Models (NBM) New data notifications for NBM-Grib2 Format, only Lambda and SQS protocols allow arn:aws:sns:us-east-1:123901341784:NewNBMGRIBObject us-east-1 SNS Topic https://vlab.noaa.gov/web/mdl/nbm For any questions regarding data delivery or any general questions regarding the [NOAA](http://www.noaa.gov/) Once per hour Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, cog, meteorological, weather NOAA National Digital Forecast Database (NDFD) National Digital Forecast Database (NDFD) Grib2 Format arn:aws:s3:::noaa-ndfd-pds us-east-1 S3 Bucket https://vlab.noaa.gov/web/mdl/ndfd (For NDFD Product information, instructions, For any questions regarding data delivery or any general questions regarding the [NOAA](http://www.noaa.gov/) As often as once every half hour (varies by forecast element, forecast projectio Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather ['[Browse Bucket](https://noaa-ndfd-pds.s3.amazonaws.com/index.html)'] NOAA National Digital Forecast Database (NDFD) New data notifications for NDFD, only Lambda and SQS protocols allowed arn:aws:sns:us-east-1:123901341784:NewNDFDObject us-east-1 SNS Topic https://vlab.noaa.gov/web/mdl/ndfd (For NDFD Product information, instructions, For any questions regarding data delivery or any general questions regarding the [NOAA](http://www.noaa.gov/) As often as once every half hour (varies by forecast element, forecast projectio Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather -NOAA National Water Model CONUS Retrospective Dataset The complete archive of NWM input forcing and model output data version 30 in N arn:aws:s3:::noaa-nwm-retrospective-3-0-pds us-east-1 S3 Bucket https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md For questions regarding data content or quality, email nws.nwc.ops@noaa.gov.For [NOAA](http://www.noaa.gov/) No updates Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation ['[Browse Bucket](https://noaa-nwm-retrospective-3-0-pds.s3.amazonaws.com/index.html)'] +NOAA National Water Model CONUS Retrospective Dataset The complete archive of NWM model output data version 21 in Zarr format The NW arn:aws:s3:::noaa-nwm-retrospective-2-1-zarr-pds us-east-1 S3 Bucket https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md For questions regarding data content or quality, email nws.nwc.ops@noaa.gov.For [NOAA](http://www.noaa.gov/) No updates Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation ['[Browse Bucket](https://noaa-nwm-retrospective-2-1-zarr-pds.s3.amazonaws.com/index.html)'] NOAA National Water Model CONUS Retrospective Dataset The complete archive of NWM data version 20 arn:aws:s3:::noaa-nwm-retro-v2-0-pds us-east-1 S3 Bucket https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md For questions regarding data content or quality, email nws.nwc.ops@noaa.gov.For [NOAA](http://www.noaa.gov/) No updates Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation ['[Browse Bucket](https://noaa-nwm-retro-v2-0-pds.s3.amazonaws.com/index.html)'] NOAA National Water Model CONUS Retrospective Dataset The streamflow from the NWM version 20 in Zarr format arn:aws:s3:::noaa-nwm-retro-v2-zarr-pds us-west-2 S3 Bucket https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md For questions regarding data content or quality, email nws.nwc.ops@noaa.gov.For [NOAA](http://www.noaa.gov/) No updates Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation ['[Browse Bucket](https://noaa-nwm-retro-v2-zarr-pds.s3.amazonaws.com/index.html)'] +NOAA National Water Model CONUS Retrospective Dataset The complete archive of NWM input forcing and model output data version 30 in N arn:aws:s3:::noaa-nwm-retrospective-3-0-pds us-east-1 S3 Bucket https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md For questions regarding data content or quality, email nws.nwc.ops@noaa.gov.For [NOAA](http://www.noaa.gov/) No updates Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation ['[Browse Bucket](https://noaa-nwm-retrospective-3-0-pds.s3.amazonaws.com/index.html)'] NOAA National Water Model CONUS Retrospective Dataset The complete archive of NWM input forcing and model output data version 21 in N arn:aws:s3:::noaa-nwm-retrospective-2-1-pds us-east-1 S3 Bucket https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md For questions regarding data content or quality, email nws.nwc.ops@noaa.gov.For [NOAA](http://www.noaa.gov/) No updates Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation ['[Browse Bucket](https://noaa-nwm-retrospective-2-1-pds.s3.amazonaws.com/index.html)'] -NOAA National Water Model CONUS Retrospective Dataset The complete archive of NWM model output data version 21 in Zarr format The NW arn:aws:s3:::noaa-nwm-retrospective-2-1-zarr-pds us-east-1 S3 Bucket https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md For questions regarding data content or quality, email nws.nwc.ops@noaa.gov.For [NOAA](http://www.noaa.gov/) No updates Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation ['[Browse Bucket](https://noaa-nwm-retrospective-2-1-zarr-pds.s3.amazonaws.com/index.html)'] NOAA National Water Model CONUS Retrospective Dataset The complete archive of NWM data version 12 arn:aws:s3:::nwm-archive us-east-1 S3 Bucket https://github.com/NOAA-Big-Data-Program/bdp-data-docs/blob/main/nwm/README.md For questions regarding data content or quality, email nws.nwc.ops@noaa.gov.For [NOAA](http://www.noaa.gov/) No updates Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation ['[Browse Bucket](https://nwm-archive.s3.amazonaws.com/index.html)'] NOAA National Water Model Short-Range Forecast Cloud-optimized zarr reference files managed by RPS Tetra Tech arn:aws:s3:::noaa-nodd-kerchunk-pds us-east-1 S3 Bucket https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-nwm-pds For questions regarding data content or quality, go [here](http://water.noaa.gov [NOAA](http://www.noaa.gov/) Daily Open Data. There are no restrictions on the use of this data aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation ['[Browse Bucket](https://noaa-nodd-kerchunk-pds.s3.amazonaws.com/index.html#nwm/)'] NOAA National Water Model Short-Range Forecast A rolling four week archive of NWM data arn:aws:s3:::noaa-nwm-pds us-east-1 S3 Bucket https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-nwm-pds For questions regarding data content or quality, go [here](http://water.noaa.gov [NOAA](http://www.noaa.gov/) Daily Open Data. There are no restrictions on the use of this data aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation ['[Browse Bucket](https://noaa-nwm-pds.s3.amazonaws.com/index.html)'] @@ -751,8 +751,8 @@ NOAA Space Weather Forecast and Observation Data New data notifications for NOAA NOAA Terrestrial Climate Data Records Leaf Area Index arn:aws:s3:::noaa-cdr-leaf-area-index-fapar-pds us-east-1 S3 Bucket https://www.ncdc.noaa.gov/cdr For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-leaf-area-index-fapar-pds.s3.amazonaws.com/index.html)'] NOAA Terrestrial Climate Data Records Snow Cover Extent arn:aws:s3:::noaa-cdr-snow-cover-ext-north-pds us-east-1 S3 Bucket https://www.ncdc.noaa.gov/cdr For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-snow-cover-ext-north-pds.s3.amazonaws.com/index.html)'] NOAA Terrestrial Climate Data Records NDVI arn:aws:s3:::noaa-cdr-ndvi-pds us-east-1 S3 Bucket https://www.ncdc.noaa.gov/cdr For questions regarding the specific CDR data holdings, please contact NCEI.SAT. [NOAA](http://www.noaa.gov/) Climate Data Records are updated independently. For update frequency for a speci Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-cdr-ndvi-pds.s3.amazonaws.com/index.html)'] -NOAA U.S. Climate Gridded Dataset (NClimGrid) New data notifications for Daily NClimGrid, only Lambda and SQS protocols allowe arn:aws:sns:us-east-1:123901341784:NewNClimGridMonthlyObject us-east-1 SNS Topic https://www.ncei.noaa.gov/access/metadata/landing-page/bin/iso?id=gov.noaa.ncdc: For any questions regarding data delivery or any general questions regarding the [NOAA](http://www.noaa.gov/) Monthly Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather NOAA U.S. Climate Gridded Dataset (NClimGrid) Monthly NClimGrid Data arn:aws:s3:::noaa-nclimgrid-monthly-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/access/metadata/landing-page/bin/iso?id=gov.noaa.ncdc: For any questions regarding data delivery or any general questions regarding the [NOAA](http://www.noaa.gov/) Monthly Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather ['[Browse Bucket](https://noaa-nclimgrid-monthly-pds.s3.amazonaws.com/index.html)'] +NOAA U.S. Climate Gridded Dataset (NClimGrid) New data notifications for Daily NClimGrid, only Lambda and SQS protocols allowe arn:aws:sns:us-east-1:123901341784:NewNClimGridMonthlyObject us-east-1 SNS Topic https://www.ncei.noaa.gov/access/metadata/landing-page/bin/iso?id=gov.noaa.ncdc: For any questions regarding data delivery or any general questions regarding the [NOAA](http://www.noaa.gov/) Monthly Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather NOAA U.S. Climate Gridded Dataset (NClimGrid) New data notifications for Daily NClimGrid, only Lambda and SQS protocols allowe arn:aws:sns:us-east-1:123901341784:NewNClimGridDailyObject us-east-1 SNS Topic https://www.ncei.noaa.gov/access/metadata/landing-page/bin/iso?id=gov.noaa.ncdc: For any questions regarding data delivery or any general questions regarding the [NOAA](http://www.noaa.gov/) Monthly Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather NOAA U.S. Climate Gridded Dataset (NClimGrid) Daily NClimGrid Data arn:aws:s3:::noaa-nclimgrid-daily-pds us-east-1 S3 Bucket https://www.ncei.noaa.gov/access/metadata/landing-page/bin/iso?id=gov.noaa.ncdc: For any questions regarding data delivery or any general questions regarding the [NOAA](http://www.noaa.gov/) Monthly Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather ['[Browse Bucket](https://noaa-nclimgrid-daily-pds.s3.amazonaws.com/index.html)'] NOAA U.S. Climate Normals US Climate Normals Data arn:aws:s3:::noaa-normals-pds us-east-1 S3 Bucket [https://www.ncei.noaa.gov/products/us-climate-normals](https://www.ncei.noaa.go For any questions regarding data delivery or any general questions regarding the [NOAA](http://www.noaa.gov/) Data is updated on 10 year cycles or when corrections are implemented. Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, sustainability, weather ['[Browse Bucket](https://noaa-normals-pds.s3.amazonaws.com/index.html)'] @@ -774,8 +774,8 @@ NOAA Wang Sheeley Arge (WSA) Enlil NOAA WSA-Enlil Products arn:aws:s3:::noaa-wsa NOAA Water-Column Sonar Data Archive NCEI Water-Column Sonar Data Archive arn:aws:s3:::noaa-wcsd-pds us-east-1 S3 Bucket https://cires.gitbook.io/ncei-wcsd-archive/ wcd.info@noaa.gov [NOAA](https://www.ngdc.noaa.gov/mgg/wcd/) New water-column sonar data are added regularly as they are provided to the arch The data may be used and redistributed for free but is not intended for legal us aws-pds, earth observation, biodiversity, ecosystems, environmental, geospatial, mapping, oceans ['[Browse Bucket](https://noaa-wcsd-pds.s3.amazonaws.com/index.html)'] NOAA Wave Ensemble Reforecast NOAA Wave Ensemble Reforecast Data arn:aws:s3:::noaa-nws-gefswaves-reforecast-pds us-east-1 S3 Bucket https://github.com/NOAA-EMC/gefswaves_reforecast/wiki https://github.com/NOAA-E For questions related to wave modeling and the ensemble reforecast available, pl [NOAA](http://www.noaa.gov/) Quarterly Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather ['[Browse Bucket](https://noaa-nws-gefswaves-reforecast-pds.s3.amazonaws.com/index.html)'] NOAA Wave Ensemble Reforecast New data notifications for NOAA Wave Ensemble Reforecast, only Lambda and SQS pr arn:aws:sns:us-east-1:709902155096:NewWERObject us-east-1 SNS Topic https://github.com/NOAA-EMC/gefswaves_reforecast/wiki https://github.com/NOAA-E For questions related to wave modeling and the ensemble reforecast available, pl [NOAA](http://www.noaa.gov/) Quarterly Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, climate, meteorological, weather -NOAA Whole Atmosphere Model-Ionosphere Plasmasphere Electrodynamics (WAM-IPE) Forecast System (WFS) New data notifications for NOAA WAM-IPE Products, only Lambda and SQS protocols arn:aws:sns:us-east-1:709902155096:NewWIFSObject us-east-1 SNS Topic https://www.swpc.noaa.gov/products/wam-ipe For any questions regarding WAM-IPE data, please contact Adam Kubaryk (adam.kuba [NOAA](http://www.noaa.gov/) The update frequencies of the WAM-IPE dataset range from 10 minutes to 6 hours d CC-0, Open Data. There are no restrictions on the use of this data. aws-pds, climate, meteorological, solar, weather NOAA Whole Atmosphere Model-Ionosphere Plasmasphere Electrodynamics (WAM-IPE) Forecast System (WFS) NOAA WAM-IPE Products arn:aws:s3:::noaa-nws-wam-ipe-pds us-east-1 S3 Bucket https://www.swpc.noaa.gov/products/wam-ipe For any questions regarding WAM-IPE data, please contact Adam Kubaryk (adam.kuba [NOAA](http://www.noaa.gov/) The update frequencies of the WAM-IPE dataset range from 10 minutes to 6 hours d CC-0, Open Data. There are no restrictions on the use of this data. aws-pds, climate, meteorological, solar, weather ['[Browse Bucket](https://noaa-nws-wam-ipe-pds.s3.amazonaws.com/index.html)'] +NOAA Whole Atmosphere Model-Ionosphere Plasmasphere Electrodynamics (WAM-IPE) Forecast System (WFS) New data notifications for NOAA WAM-IPE Products, only Lambda and SQS protocols arn:aws:sns:us-east-1:709902155096:NewWIFSObject us-east-1 SNS Topic https://www.swpc.noaa.gov/products/wam-ipe For any questions regarding WAM-IPE data, please contact Adam Kubaryk (adam.kuba [NOAA](http://www.noaa.gov/) The update frequencies of the WAM-IPE dataset range from 10 minutes to 6 hours d CC-0, Open Data. There are no restrictions on the use of this data. aws-pds, climate, meteorological, solar, weather NOAA World Ocean Database (WOD) World Ocean Database (WOD) NetCDF Format arn:aws:s3:::noaa-wod-pds us-east-1 S3 Bucket https://www.nodc.noaa.gov/OC5/WOD/pr_wod.html For any questions regarding data delivery not associated with this platform or a [NOAA](http://www.noaa.gov/) Data is update on a quarterly basis Open Data. There are no restrictions on the use of this data. aws-pds, climate, oceans ['[Browse Bucket](https://noaa-wod-pds.s3.amazonaws.com/index.html)'] NOAA's Coastal Ocean Reanalysis (CORA) Dataset NOAA’s Coastal Ocean Reanalysis (CORA) Dataset NetCDF arn:aws:s3:::noaa-nos-cora-pds us-east-1 S3 Bucket https://tidesandcurrents.noaa.gov/ For questions regarding data content or quality, email CO-OPS.UserServices@noaa. [NOAA’s National Ocean Service, The Center for Operational Oceanographic Product Monthly, quarterly, and annually, depending on the dataset. Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation, oceans ['[Browse Bucket](https://noaa-nos-cora-pds.s3.amazonaws.com/index.html)'] NOAA's Coastal Ocean Reanalysis (CORA) Dataset NOAA’s Coastal Ocean Reanalysis (CORA) Dataset Notifications arn:aws:sns:us-east-1:709902155096:NewNOSCORAObject us-east-1 SNS Topic https://tidesandcurrents.noaa.gov/ For questions regarding data content or quality, email CO-OPS.UserServices@noaa. [NOAA’s National Ocean Service, The Center for Operational Oceanographic Product Monthly, quarterly, and annually, depending on the dataset. Open Data. There are no restrictions on the use of this data. aws-pds, agriculture, weather, climate, environmental, disaster response, agriculture, transportation, oceans @@ -816,19 +816,19 @@ NREL Wind Integration National Dataset NW Pacific Wind Resource data for (2000-2 NREL Wind Integration National Dataset Techno-economic subset of the WIND Toolkit by location in netCDF arn:aws:s3:::nrel-pds-wtk/wtk-techno-economic/pywtk-data/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=wtk-techno-economic%2Fpywtk-data%2F)'] NREL Wind Integration National Dataset Vietnam wind resource data (2016-2018) in HDF5 format arn:aws:s3:::nrel-pds-wtk/vietnam/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=vietnam%2F)'] NREL Wind Integration National Dataset Southeast Asia wind resource data (2017-2021) in HDF5 format arn:aws:s3:::nrel-pds-wtk/seasiawind/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=seasiawind%2F)'] +NREL Wind Integration National Dataset California offshore wind resource data (2000-2022) in HDF5 format arn:aws:s3:::nrel-pds-wtk/now23_california/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=now23_california%2F)'] NREL Wind Integration National Dataset Bias corrected Indonesia wind resource arn:aws:s3:::nrel-pds-wtk/indonesia/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=indonesia%2F)'] NREL Wind Integration National Dataset Mid Atlantic wind resource data with modeled wakes in HDF5 format arn:aws:s3:::nrel-pds-wtk/NOW-WAKES_Mid_Atlantic/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=NOW-WAKES_Mid_Atlantic%2F)'] NREL Wind Integration National Dataset Southeast Asia wind resource data v3 (2007-2021) in HDF5 format arn:aws:s3:::nrel-pds-wtk/seasiawind_v3/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=seasiawind_v3%2F)'] NREL Wind Integration National Dataset Southeast Asia wind resource data v2 (2007-2021) in HDF5 format arn:aws:s3:::nrel-pds-wtk/seasiawind_v2/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=seasiawind_v2%2F)'] -NREL Wind Integration National Dataset Data for the Eastern Wind Integration Study (2004-2006 arn:aws:s3:::nrel-pds-wtk/eastern_wind/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=eastern_wind%2F)'] NREL Wind Integration National Dataset Puerto Rico wind resource data (2001-2020) in HDF5 format arn:aws:s3:::nrel-pds-wtk/pr100/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=pr100%2F)'] -NREL Wind Integration National Dataset California offshore wind resource data (2000-2022) in HDF5 format arn:aws:s3:::nrel-pds-wtk/now23_california/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=now23_california%2F)'] +NREL Wind Integration National Dataset South Atlantic offshore wind resource data (2000-2020) in HDF5 format arn:aws:s3:::nrel-pds-wtk/south_atlantic/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=south_atlantic)'] NREL Wind Integration National Dataset Philippines typical meteorological year data in HDF5 format arn:aws:s3:::nrel-pds-wtk/philippines_tmy/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=philippines_tmy%2F)'] NREL Wind Integration National Dataset Great Lakes wind resource data (2000-2020) in HDF5 format arn:aws:s3:::nrel-pds-wtk/Great_Lakes/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=Great_Lakes%2F)'] -NREL Wind Integration National Dataset Mid Atlantic three-dimensional planetary boundary layer (3D PBL) scheme wind res arn:aws:s3:::nrel-pds-wtk/mid_atlantic_3d_pbl/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=mid_atlantic_3d_pbl%2F)'] -NREL Wind Integration National Dataset Data for the Western Wind Integration Study (2004-2006 arn:aws:s3:::nrel-pds-wtk/western_wind/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=western_wind%2F)'] NREL Wind Integration National Dataset Bias Corrected NOAA HRRR Wind Resource Data for Grid Integration Applications arn:aws:s3:::nrel-pds-wtk/bchrrr/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=bchrrr%2F)'] -NREL Wind Integration National Dataset South Atlantic offshore wind resource data (2000-2020) in HDF5 format arn:aws:s3:::nrel-pds-wtk/south_atlantic/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=south_atlantic)'] +NREL Wind Integration National Dataset Data for the Western Wind Integration Study (2004-2006 arn:aws:s3:::nrel-pds-wtk/western_wind/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=western_wind%2F)'] +NREL Wind Integration National Dataset Data for the Eastern Wind Integration Study (2004-2006 arn:aws:s3:::nrel-pds-wtk/eastern_wind/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=eastern_wind%2F)'] +NREL Wind Integration National Dataset Mid Atlantic three-dimensional planetary boundary layer (3D PBL) scheme wind res arn:aws:s3:::nrel-pds-wtk/mid_atlantic_3d_pbl/ us-west-2 S3 Bucket https://www.nrel.gov/grid/wind-toolkit.html wind-toolkit@nrel.gov [National Renewable Energy Laboratory](https://www.nrel.gov/) As Needed Creative Commons Attribution 3.0 United States License aws-pds, environmental, geospatial, meteorological ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=mid_atlantic_3d_pbl%2F)'] NSF NCAR Curated ECMWF Reanalysis 5 (ERA5) Notifications for the NSF NCAR ERA5 bucket arn:aws:sns:us-west-2:891377163634:nsf-ncar-era5-object_created us-west-2 SNS Topic https://doi.org/10.5065/BH6N-5N20 rdahelp@ucar.edu [NSF National Center for Atmospheric Research](https://ncar.ucar.edu/) Monthly, with a 3-4 month lag from realtime https://www.ucar.edu/terms-of-use/data climate, model, atmosphere, land, data assimilation, forecast, meteorological, weather, geoscience, geospatial, aws-pds, netcdf NSF NCAR Curated ECMWF Reanalysis 5 (ERA5) ERA5 NetCDF4 Data Files arn:aws:s3:::nsf-ncar-era5 us-west-2 S3 Bucket https://doi.org/10.5065/BH6N-5N20 rdahelp@ucar.edu [NSF National Center for Atmospheric Research](https://ncar.ucar.edu/) Monthly, with a 3-4 month lag from realtime https://www.ucar.edu/terms-of-use/data climate, model, atmosphere, land, data assimilation, forecast, meteorological, weather, geoscience, geospatial, aws-pds, netcdf ['[Browse Bucket](https://nsf-ncar-era5.s3.amazonaws.com/index.html)'] NYU Langone & FAIR FastMRI Dataset Raw k-space data and DICOM files for a knee and brain dataset in a public S3 buc arn:aws:s3:::fastmri-dataset us-east-1 S3 Bucket https://fastmri.med.nyu.edu/ [Florian Knoll](florian.knoll@nyuangone.org) [FastMRI](https://fastmri.med.nyu.edu/) The dataset is estimated to grow annually to include MRI raw data and imaging fo MIT License aws-pds, life sciences, health, imaging, biology, image processing, neurobiology, neuroimaging, magnetic resonance imaging https://fastmri.med.nyu.edu/ @@ -922,14 +922,14 @@ Open Observatory of Network Interference (OONI) New S3 bucket with JSONL files a Open Observatory of Network Interference (OONI) Old S3 bucket with cans for older measurements arn:aws:s3:::ooni-data us-east-1 S3 Bucket https://ooni.org/data/ https://ooni.org/get-involved/ Open Observatory of Network Interference Hourly Creative Commons Attribution-NonCommercial-ShareAlike 4.0 International https:// aws-pds, internet Open VLF: Scientific Open Data Initiative for CRAAM's SAVNET and AWESOME VLF Data. The Open VLF Files Total size of 736 GB arn:aws:s3:::craam-files-bucket sa-east-1 S3 Bucket [Open VLF](https://open-vlf.web.app) [Open VLF Feedback](https://open-vlf.web.app/markdown/the-project) [CRAAM Mackenzie](https://www.mackenzie.br/centro-de-radio-astronomia-e-astrofis Various. Data since 2006, and still updated. Follow the announcements and what i There are no restrictions on the use of this data. archives, astronomy, atmosphere, aws-pds, global, open source software, signal processing, life sciences Open-Meteo Weather API Database Open-Meteo Weather API Database arn:aws:s3:::openmeteo us-west-2 S3 Bucket https://github.com/open-meteo/open-data info@open-meteo.com [Open-Meteo](https://www.open-meteo.com/) Hourly CC-BY 4.0 aws-pds, agriculture, climate, earth observation, meteorological, weather ['[Browse Bucket](https://openmeteo.s3.amazonaws.com/index.html#data/)'] -OpenAQ OpenAQ API us-east-1 CloudFront Distribution https://openaq.org info@openaq.org [OpenAQ](https://openaq.org) Hourly Varies, depends on data provider aws-pds, air quality, cities, environmental, geospatial api.openaq.org OpenAQ SNS topic for new objects in the openaq-data-archive bucket arn:aws:sns:us-east-1:817926761842:openaq-data-archive-object_created us-east-1 SNS Topic https://openaq.org info@openaq.org [OpenAQ](https://openaq.org) Hourly Varies, depends on data provider aws-pds, air quality, cities, environmental, geospatial OpenAQ Daily gzipped CSVs of global air quality measurements fetched from sources all o arn:aws:s3:::openaq-data-archive us-east-1 S3 Bucket https://openaq.org info@openaq.org [OpenAQ](https://openaq.org) Hourly Varies, depends on data provider aws-pds, air quality, cities, environmental, geospatial +OpenAQ OpenAQ API us-east-1 CloudFront Distribution https://openaq.org info@openaq.org [OpenAQ](https://openaq.org) Hourly Varies, depends on data provider aws-pds, air quality, cities, environmental, geospatial api.openaq.org OpenAerialMap on AWS OpenAerialMap files and metadata arn:aws:s3:::oin-hotosm us-east-1 S3 Bucket https://docs.openaerialmap.org/ info@openaerialmap.org [Humanitarian OpenStreetMap Team](https://www.hotosm.org/) New imagery is added as soon as it is uploaded by community contributors. All imagery is publicly licensed CC-BY 4.0, with attribution as contributors of satellite imagery, aerial imagery, earth observation, disaster response, cog ['[Browse Bucket](https://oin-hotosm.s3.amazonaws.com/)'] -OpenAlex dataset Openalex Entities decomposed to tab-separated columnar files for backward compat arn:aws:s3:::openalex-mag-format us-east-1 S3 Bucket https://docs.openalex.org team@ourresearch.org [OurResearch](https://ourresearch.org/) Approximately monthly [CC0](https://creativecommons.org/publicdomain/zero/1.0/) graph, json, metadata, scholarly communication, aws-pds ['[Browse Bucket](https://openalex-mag-format.s3.amazonaws.com/browse.html)'] OpenAlex dataset OpenAlex Entities in JSON Lines format arn:aws:s3:::openalex us-east-1 S3 Bucket https://docs.openalex.org team@ourresearch.org [OurResearch](https://ourresearch.org/) Approximately monthly [CC0](https://creativecommons.org/publicdomain/zero/1.0/) graph, json, metadata, scholarly communication, aws-pds ['[Browse Bucket](https://openalex.s3.amazonaws.com/browse.html)'] -OpenCRAVAT OpenCRAVAT Store EU arn:aws:s3:::opencravat-store-eu-west-2 eu-west-2 S3 Bucket https://open-cravat.readthedocs.io support@opencravat.org KarchinLab, Potomac IT Group Data is mirrored daily. Update frequencies of individual annotators depend on th "License varies per-annotator. Commercial users must check the ""commercial_warnin" aws-pds, genetic, genomic, life sciences, variant annotation, sqlite, tertiary analysis +OpenAlex dataset Openalex Entities decomposed to tab-separated columnar files for backward compat arn:aws:s3:::openalex-mag-format us-east-1 S3 Bucket https://docs.openalex.org team@ourresearch.org [OurResearch](https://ourresearch.org/) Approximately monthly [CC0](https://creativecommons.org/publicdomain/zero/1.0/) graph, json, metadata, scholarly communication, aws-pds ['[Browse Bucket](https://openalex-mag-format.s3.amazonaws.com/browse.html)'] OpenCRAVAT OpenCRAVAT Store US arn:aws:s3:::opencravat-store-aws us-east-1 S3 Bucket https://open-cravat.readthedocs.io support@opencravat.org KarchinLab, Potomac IT Group Data is mirrored daily. Update frequencies of individual annotators depend on th "License varies per-annotator. Commercial users must check the ""commercial_warnin" aws-pds, genetic, genomic, life sciences, variant annotation, sqlite, tertiary analysis +OpenCRAVAT OpenCRAVAT Store EU arn:aws:s3:::opencravat-store-eu-west-2 eu-west-2 S3 Bucket https://open-cravat.readthedocs.io support@opencravat.org KarchinLab, Potomac IT Group Data is mirrored daily. Update frequencies of individual annotators depend on th "License varies per-annotator. Commercial users must check the ""commercial_warnin" aws-pds, genetic, genomic, life sciences, variant annotation, sqlite, tertiary analysis OpenCell on AWS Live-cell confocal fluorescence microscopy images of the OpenCell library of flu arn:aws:s3:::czb-opencell us-west-2 S3 Bucket https://opencell.czbiohub.org/download opencell@czbiohub.org [Chan Zuckerberg Biohub](https://www.czbiohub.org/) This is the final version of the dataset. https://github.com/czbiohub/opencell/blob/master/LICENSE aws-pds, biology, cell biology, life sciences, imaging, cell imaging, fluorescence imaging, microscopy, computer vision, machine learning OpenEEW OpenEEW arn:aws:s3:::grillo-openeew us-east-1 S3 Bucket https://github.com/openeew/openeew hello@openeew.com [Grillo](https://grillo.io/) Approximately every 5 minutes https://github.com/openeew/openeew#license disaster response, earth observation, earthquakes, aws-pds ['[Browse Bucket](https://grillo-openeew.s3.amazonaws.com/index.html)'] OpenNeuro MRI, MEG, EEG, iEEG, and ECoG datasets from OpenNeuro arn:aws:s3:::openneuro.org us-east-1 S3 Bucket http://openneuro.org Support form at https://openneuro.org [Stanford University Center for Reproducible Neuroscience](https://reproducibili New datasets deposited every 4-6 days CC0 aws-pds, biology, imaging, life sciences, neurobiology, neuroimaging @@ -937,19 +937,19 @@ OpenProteinSet A repository of MSAs and template hits arn:aws:s3:::openfold us-e OpenStreetMap on AWS New data notifications arn:aws:sns:us-east-1:800218804198:New_File us-east-1 SNS Topic https://github.com/awslabs/open-data-docs/tree/main/docs/osm-pds https://github.com/mojodna/osm-pds-pipelines/issues Pacific Atlas Data is updated weekly https://www.openstreetmap.org/copyright aws-pds, geospatial, mapping, osm, disaster response OpenStreetMap on AWS Imagery and metadata arn:aws:s3:::osm-pds us-east-1 S3 Bucket https://github.com/awslabs/open-data-docs/tree/main/docs/osm-pds https://github.com/mojodna/osm-pds-pipelines/issues Pacific Atlas Data is updated weekly https://www.openstreetmap.org/copyright aws-pds, geospatial, mapping, osm, disaster response OpenSurfaces OpenSurfaces data arn:aws:s3:::labelmaterial us-east-1 S3 Bucket http://opensurfaces.cs.cornell.edu/publications/opensurfaces/ snavely@cs.cornell.edu Cornell University Static dataset (not updated) The annotations are licensed under a Creative Commons Attribution 4.0 Internatio computer vision, aws-pds ['[Browse data on project webpage](http://opensurfaces.cs.cornell.edu/)'] -OpenUniverse 2024 Matched Rubin and Roman Simulations: Preview The simulated Rubin data products include raw pixel data, calibrated exposures, arn:aws:s3:::nasa-irsa-simulations/openuniverse2024/rubin/ us-east-1 S3 Bucket https://irsa.ipac.caltech.edu/data/theory/openuniverse2024 https://irsa.ipac.caltech.edu/docs/help_desk.html NASA/IPAC Infrared Science Archive ([IRSA](https://irsa.ipac.caltech.edu)) at Ca The OpenUniverse 2024 Data Preview has been finalized and will not be updated. https://irsa.ipac.caltech.edu/data_use_terms.html aws-pds, astronomy, imaging, object detection, parquet, satellite imagery, simulations, survey False False OpenUniverse 2024 Matched Rubin and Roman Simulations: Preview The simulated Roman data products include truth files listing the basic physical arn:aws:s3:::nasa-irsa-simulations/openuniverse2024/roman/ us-east-1 S3 Bucket https://irsa.ipac.caltech.edu/data/theory/openuniverse2024 https://irsa.ipac.caltech.edu/docs/help_desk.html NASA/IPAC Infrared Science Archive ([IRSA](https://irsa.ipac.caltech.edu)) at Ca The OpenUniverse 2024 Data Preview has been finalized and will not be updated. https://irsa.ipac.caltech.edu/data_use_terms.html aws-pds, astronomy, imaging, object detection, parquet, satellite imagery, simulations, survey False False +OpenUniverse 2024 Matched Rubin and Roman Simulations: Preview The simulated Rubin data products include raw pixel data, calibrated exposures, arn:aws:s3:::nasa-irsa-simulations/openuniverse2024/rubin/ us-east-1 S3 Bucket https://irsa.ipac.caltech.edu/data/theory/openuniverse2024 https://irsa.ipac.caltech.edu/docs/help_desk.html NASA/IPAC Infrared Science Archive ([IRSA](https://irsa.ipac.caltech.edu)) at Ca The OpenUniverse 2024 Data Preview has been finalized and will not be updated. https://irsa.ipac.caltech.edu/data_use_terms.html aws-pds, astronomy, imaging, object detection, parquet, satellite imagery, simulations, survey False False Opioid Industry Documents Archive (OIDA) Data on AWS Raw data from the Opioid Industry Documents Archive (OIDA), including documents arn:aws:s3:::opioid-industry-documents-archive-dataset-bucket us-east-1 S3 Bucket https://opioid-industry-documents-archive-dataset-bucket.s3.amazonaws.com/index. opioidarchive@jh.edu Johns Hopkins University monthly https://www.industrydocuments.ucsf.edu/opioids/help/copyright/ aws-pds, archives, text analysis, txt, pharmaceutical, life sciences -Orcasound - bioacoustic data for marine conservation Live-streamed orca audio data (HLS) arn:aws:s3:::streaming-orcasound-net us-west-2 S3 Bucket https://github.com/orcasound/orcadata/wiki info@orcasound.net Orcasound Typical latency is 10-120 seconds https://creativecommons.org/licenses/by-nc-sa/4.0/ aws-pds, biodiversity, biology, coastal, conservation, deep learning, ecosystems, environmental, geospatial, labeled, machine learning, mapping, oceans, open source software, signal processing Orcasound - bioacoustic data for marine conservation Archived lossless orca audio data (FLAC) arn:aws:s3:::archive-orcasound-net us-west-2 S3 Bucket https://github.com/orcasound/orcadata/wiki info@orcasound.net Orcasound Typical latency is 10-120 seconds https://creativecommons.org/licenses/by-nc-sa/4.0/ aws-pds, biodiversity, biology, coastal, conservation, deep learning, ecosystems, environmental, geospatial, labeled, machine learning, mapping, oceans, open source software, signal processing +Orcasound - bioacoustic data for marine conservation Live-streamed orca audio data (HLS) arn:aws:s3:::streaming-orcasound-net us-west-2 S3 Bucket https://github.com/orcasound/orcadata/wiki info@orcasound.net Orcasound Typical latency is 10-120 seconds https://creativecommons.org/licenses/by-nc-sa/4.0/ aws-pds, biodiversity, biology, coastal, conservation, deep learning, ecosystems, environmental, geospatial, labeled, machine learning, mapping, oceans, open source software, signal processing Orcasound - bioacoustic data for marine conservation Labeled audio data for ML model development arn:aws:s3:::acoustic-sandbox us-west-2 S3 Bucket https://github.com/orcasound/orcadata/wiki info@orcasound.net Orcasound Typical latency is 10-120 seconds https://creativecommons.org/licenses/by-nc-sa/4.0/ aws-pds, biodiversity, biology, coastal, conservation, deep learning, ecosystems, environmental, geospatial, labeled, machine learning, mapping, oceans, open source software, signal processing Oregon Health & Science University Chronic Neutrophilic Leukemia Dataset RNA-Seq Gene Expression Quantification arn:aws:s3:::gdc-ohsu-cnl-phs001799-2-open us-east-1 S3 Bucket https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/study.cgi?study_id=phs001799.v dcf-support@datacommons.io [Center for Translational Data Science at The University of Chicago](https://ctd Genomic Data Commons (GDC) is source of truth for this dataset; GDC offers month NIH Genomic Data Sharing Policy: https://gdc.cancer.gov/access-data/data-access- aws-pds, cancer, genomic, life sciences -Overture Maps Foundation Open Map Data New File Notification arn:aws:sns:us-west-2:913550007193:overturemaps-us-west-2 us-west-2 SNS Topic Documentation is available at [docs.overturemaps.org](https://docs.overturemaps. info@overturemaps.org [Overture Maps Foundation](https://overturemaps.org) Monthly Overture data is licensed under the Community Database License Agreement Permiss aws-pds, geospatial, global, mapping, osm, parquet, transportation Overture Maps Foundation Open Map Data Overture Maps Foundation Data (GeoParquet) arn:aws:s3:::overturemaps-us-west-2/release/ us-west-2 S3 Bucket Documentation is available at [docs.overturemaps.org](https://docs.overturemaps. info@overturemaps.org [Overture Maps Foundation](https://overturemaps.org) Monthly Overture data is licensed under the Community Database License Agreement Permiss aws-pds, geospatial, global, mapping, osm, parquet, transportation -Oxford Nanopore Technologies Benchmark Datasets Using nanopore sequencing, researchers have directly identified DNA and RNA base arn:aws:s3:::ont-open-data/gm24385_mod_2021.09/extra_analysis/bonito_remora eu-west-1 S3 Bucket https://labs.epi2me.io/dataindex/ support@nanoporetech.com Oxford Nanopore Technologies Additional datasets will be added periodically. Updates and amendents will be ma Attribution-NonCommercial 4.0 International (CC BY-NC 4.0) https://creativecommo aws-pds, bioinformatics, biology, fastq, fast5, genomic, life sciences, Homo sapiens, whole genome sequencing False +Overture Maps Foundation Open Map Data New File Notification arn:aws:sns:us-west-2:913550007193:overturemaps-us-west-2 us-west-2 SNS Topic Documentation is available at [docs.overturemaps.org](https://docs.overturemaps. info@overturemaps.org [Overture Maps Foundation](https://overturemaps.org) Monthly Overture data is licensed under the Community Database License Agreement Permiss aws-pds, geospatial, global, mapping, osm, parquet, transportation Oxford Nanopore Technologies Benchmark Datasets CpG dinucleotides frequently occur in high-density clusters called CpG islands ( arn:aws:s3:::ont-open-data/rrms_2022.07 eu-west-1 S3 Bucket https://labs.epi2me.io/dataindex/ support@nanoporetech.com Oxford Nanopore Technologies Additional datasets will be added periodically. Updates and amendents will be ma Attribution-NonCommercial 4.0 International (CC BY-NC 4.0) https://creativecommo aws-pds, bioinformatics, biology, fastq, fast5, genomic, life sciences, Homo sapiens, whole genome sequencing False -Oxford Nanopore Technologies Benchmark Datasets Oxford Nanopore Open Datasets arn:aws:s3:::ont-open-data eu-west-1 S3 Bucket https://labs.epi2me.io/dataindex/ support@nanoporetech.com Oxford Nanopore Technologies Additional datasets will be added periodically. Updates and amendents will be ma Attribution-NonCommercial 4.0 International (CC BY-NC 4.0) https://creativecommo aws-pds, bioinformatics, biology, fastq, fast5, genomic, life sciences, Homo sapiens, whole genome sequencing False +Oxford Nanopore Technologies Benchmark Datasets Using nanopore sequencing, researchers have directly identified DNA and RNA base arn:aws:s3:::ont-open-data/gm24385_mod_2021.09/extra_analysis/bonito_remora eu-west-1 S3 Bucket https://labs.epi2me.io/dataindex/ support@nanoporetech.com Oxford Nanopore Technologies Additional datasets will be added periodically. Updates and amendents will be ma Attribution-NonCommercial 4.0 International (CC BY-NC 4.0) https://creativecommo aws-pds, bioinformatics, biology, fastq, fast5, genomic, life sciences, Homo sapiens, whole genome sequencing False Oxford Nanopore Technologies Benchmark Datasets Nanopore sequencing data of the Genome in a Bottle samples NA24385, NA24149, and arn:aws:s3:::ont-open-data/giab_lsk114_2022.12 eu-west-1 S3 Bucket https://labs.epi2me.io/dataindex/ support@nanoporetech.com Oxford Nanopore Technologies Additional datasets will be added periodically. Updates and amendents will be ma Attribution-NonCommercial 4.0 International (CC BY-NC 4.0) https://creativecommo aws-pds, bioinformatics, biology, fastq, fast5, genomic, life sciences, Homo sapiens, whole genome sequencing False +Oxford Nanopore Technologies Benchmark Datasets Oxford Nanopore Open Datasets arn:aws:s3:::ont-open-data eu-west-1 S3 Bucket https://labs.epi2me.io/dataindex/ support@nanoporetech.com Oxford Nanopore Technologies Additional datasets will be added periodically. Updates and amendents will be ma Attribution-NonCommercial 4.0 International (CC BY-NC 4.0) https://creativecommo aws-pds, bioinformatics, biology, fastq, fast5, genomic, life sciences, Homo sapiens, whole genome sequencing False Ozone Monitoring Instrument (OMI) / Aura NO2 Tropospheric Column Density S3 Bucket for OMI NO2 in Cloud-Optimized GeoTiff format arn:aws:s3:::omi-no2-nasa us-west-2 S3 Bucket https://disc.gsfc.nasa.gov/datasets/OMNO2d_003/summary binita.kc@nasa.gov NASA None There are no restrictions on the use of these data. aws-pds, earth observation, geospatial, satellite imagery, air quality, atmosphere, environmental PALSAR-2 ScanSAR CARD4L (L2.2) PALSAR-2 ScanSAR CARD4L arn:aws:s3:::jaxaalos2/palsar2/L2.2/Africa/ us-west-2 S3 Bucket https://www.eorc.jaxa.jp/ALOS/en/dataset/palsar2_l22_e.htm aproject@jaxa.jp [JAXA](https://www.jaxa.jp/) Every month after 42 days observed Data is available for free under the [terms of use](https://earth.jaxa.jp/policy aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, sustainability, disaster response, synthetic aperture radar, deafrica, stac, cog False PALSAR-2 ScanSAR Flooding in Rwanda (L2.1) PALSAR-2 ScanSAR L11 & L22 arn:aws:s3:::jaxaalos2/palsar2-scansar/Rwanda/ us-west-2 S3 Bucket https://www.eorc.jaxa.jp/ALOS/en/dataset/alos_open_and_free_e.htm, https://www.e aproject@jaxa.jp [JAXA](https://www.jaxa.jp/) As available. Data is available for free under the terms of use. aws-pds, agriculture, cog, deafrica, disaster response, earth observation, geospatial, natural resource, satellite imagery, stac, sustainability, synthetic aperture radar False @@ -958,51 +958,51 @@ PALSAR-2 ScanSAR Turkey & Syria Earthquake (L2.1 & L1.1) PALSAR-2 ScanSAR L11 & PASS: Perturb-and-Select Summarizer for Product Reviews A collection of summaries generated by PASS for the FewSum Product Reviews datas arn:aws:s3:::pass-summary-fewsum us-east-1 S3 Bucket https://pass-summary-fewsum.s3.amazonaws.com/README.md noved@amazon.com [Amazon](https://www.amazon.com/) Not updated This data is available for anyone to use under the terms of the CDLA-Sharing lic amazon.science, natural language processing, text analysis ['[pass_generated_summaries.jsonl](https://pass-summary-fewsum.s3.amazonaws.com/pass_gen_summaries_fewsum_amazon_val_test.jsonl)'] PD12M Image files arn:aws:s3:::pd12m us-west-2 S3 Bucket https://huggingface.co/datasets/Spawning/PD12M info@spawning.ai Spawning Data will be adjusted as infringing works are discovered, improved provenance is https://cdla.dev/permissive-2-0/ image processing, machine learning, media, art, deep learning, labeled PROJ datum grids Horizontal and vertical adjustment datasets us-east-1 CloudFront Distribution https://github.com/OSGeo/proj-datumgrid-geotiff proj@lists.osgeo.org [PROJ](https://proj.org) New grids are added when made available Per file. Under an Open Source Definition compliant license. Consult the READMEs aws-pds, geospatial, mapping cdn.proj.org -Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2018 arn:aws:s3:::pacific-sound-256khz-2018 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software +Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2015 arn:aws:s3:::pacific-sound-256khz-2015 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software +Pacific Ocean Sound Recordings machine learning models arn:aws:s3:::pacific-sound-models us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software Pacific Ocean Sound Recordings decimated 16 kHz audio recordings arn:aws:s3:::pacific-sound-16khz us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software -Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2017 arn:aws:s3:::pacific-sound-256khz-2017 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software -Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2016 arn:aws:s3:::pacific-sound-256khz-2016 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software -Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2019 arn:aws:s3:::pacific-sound-256khz-2019 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software -Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2020 arn:aws:s3:::pacific-sound-256khz-2020 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software Pacific Ocean Sound Recordings decimated 2 kHz audio recordings arn:aws:s3:::pacific-sound-2khz us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software -Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2022 arn:aws:s3:::pacific-sound-256khz-2022 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software -Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2023 arn:aws:s3:::pacific-sound-256khz-2023 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software -Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2024 arn:aws:s3:::pacific-sound-256khz-2024 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2025 arn:aws:s3:::pacific-sound-256khz-2025 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software -Pacific Ocean Sound Recordings machine learning models arn:aws:s3:::pacific-sound-models us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software +Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2023 arn:aws:s3:::pacific-sound-256khz-2023 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software +Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2022 arn:aws:s3:::pacific-sound-256khz-2022 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2021 arn:aws:s3:::pacific-sound-256khz-2021 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software -Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2015 arn:aws:s3:::pacific-sound-256khz-2015 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software +Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2020 arn:aws:s3:::pacific-sound-256khz-2020 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software +Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2019 arn:aws:s3:::pacific-sound-256khz-2019 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software +Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2018 arn:aws:s3:::pacific-sound-256khz-2018 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software +Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2017 arn:aws:s3:::pacific-sound-256khz-2017 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software +Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2016 arn:aws:s3:::pacific-sound-256khz-2016 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software +Pacific Ocean Sound Recordings original 256 kHz audio recordings year 2024 arn:aws:s3:::pacific-sound-256khz-2024 us-west-2 S3 Bucket https://docs.mbari.org/pacific-sound/ dcline@mbari.org [Monterey Bay Aquarium Research Institute](https://www.mbari.org/) daily CC-BY 4.0 aws-pds, acoustics, biodiversity, ecosystems, biology, marine mammals, oceans, climate, coastal, deep learning, machine learning, environmental, open source software Pan-STARRS PS1 Survey PS1 DR1 and DR2 image files arn:aws:s3:::stpubdata/ps1 us-east-1 S3 Bucket https://outerspace.stsci.edu/display/PANSTARRS/ archive@stsci.edu [Space Telescope Science Institute](http://www.stsci.edu/) Never STScI hereby grants the non-exclusive, royalty-free, non-transferable, worldwide aws-pds, astronomy False -Pancreatic Cancer Organoid Profiling RNA-Seq Gene Expression Quantification arn:aws:s3:::gdc-organoid-pancreatic-phs001611-2-open us-east-1 S3 Bucket https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/study.cgi?study_id=phs001611.v dcf-support@datacommons.io [Center for Translational Data Science at The University of Chicago](https://ctd Genomic Data Commons (GDC) is source of truth for this dataset; GDC offers month NIH Genomic Data Sharing Policy: https://gdc.cancer.gov/access-data/data-access- aws-pds, cancer, genetic, genomic, transcriptomics, whole genome sequencing, STRIDES, life sciences Pancreatic Cancer Organoid Profiling WGS/WXS/RNA-Seq Aligned Reads, WXS Annotated Somatic Mutation, WXS Raw Somatic M arn:aws:s3:::gdc-organoid-pancreatic-phs001611-2-controlled us-east-1 S3 Bucket https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/study.cgi?study_id=phs001611.v dcf-support@datacommons.io [Center for Translational Data Science at The University of Chicago](https://ctd Genomic Data Commons (GDC) is source of truth for this dataset; GDC offers month NIH Genomic Data Sharing Policy: https://gdc.cancer.gov/access-data/data-access- aws-pds, cancer, genetic, genomic, transcriptomics, whole genome sequencing, STRIDES, life sciences https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/study.cgi?study_id=phs001611.v1.p1 +Pancreatic Cancer Organoid Profiling RNA-Seq Gene Expression Quantification arn:aws:s3:::gdc-organoid-pancreatic-phs001611-2-open us-east-1 S3 Bucket https://www.ncbi.nlm.nih.gov/projects/gap/cgi-bin/study.cgi?study_id=phs001611.v dcf-support@datacommons.io [Center for Translational Data Science at The University of Chicago](https://ctd Genomic Data Commons (GDC) is source of truth for this dataset; GDC offers month NIH Genomic Data Sharing Policy: https://gdc.cancer.gov/access-data/data-access- aws-pds, cancer, genetic, genomic, transcriptomics, whole genome sequencing, STRIDES, life sciences PersonPath22 Source data arn:aws:s3:::tracking-dataset-eccv-2022 us-east-2 S3 Bucket https://amazon-science.github.io/tracking-dataset/personpath22.html Post any questions to [re:Post](https://repost.aws/tags/questions/TApd0Wl5P8S9O6 [Amazon Web Services](https://aws.amazon.com/) Periodically Creative Commons Attribution-NonCommercial 4.0 International Public License (CC amazon.science, computer vision Phrase Clustering Dataset (PCD) Phsrase Clustering Dataset (PCD) arn:aws:s3:::amazon-phrase-clustering us-west-2 S3 Bucket https://amazon-phrase-clustering.s3.amazonaws.com/readme.md Post any questions to [re:Post](https://repost.aws/tags/questions/TApd0Wl5P8S9O6 [Amazon](https://www.amazon.com/) Not updated This data is available for anyone to use under the terms of the CDLA-permissive amazon.science, natural language processing, json ['[phrase-clustering-dataset.json](https://amazon-phrase-clustering.s3.amazonaws.com/phrase-clustering-dataset.json)'] Physionet https://s3amazonawscom/physionet-pds/indexhtml arn:aws:s3:::physionet-pds us-east-1 S3 Bucket https://physionet.org/ contact@physionet.org [MIT Laboratory for Computational Physiology](https://lcp.mit.edu/) Not updated PhysioBank databases are made available under the ODC Public Domain Dedication a aws-pds, biology, life sciences Platinum Pedigree https://githubcom/Platinum-Pedigree-Consortium/Platinum-Pedigree-Datasets arn:aws:s3:::platinum-pedigree-data us-west-1 S3 Bucket https://github.com/Platinum-Pedigree-Consortium https://github.com/Platinum-Pedigree-Consortium/Platinum-Pedigree-Datasets/issue Platinum Pedigree Consortium As needed [CC BY 4.0](https://creativecommons.org/licenses/by/4.0/) genomic, genotyping, long read sequencing, bioinformatics, Homo sapiens, life sciences, whole genome sequencing Pohang Canal Dataset: A Multimodal Maritime Dataset for Autonomous Navigation in Restricted Waters Pohang Canal dataset arn:aws:s3:::pohang-canal-dataset us-west-2 S3 Bucket https://sites.google.com/view/pohang-canal-dataset/home morin-lab@kaist.ac.kr [MORIN](http://morin.kaist.ac.kr) Not updated [CC BY-NC 4.0](https://creativecommons.org/licenses/by-nc/4.0/) aws-pds, autonomous vehicles, marine navigation, robotics, computer vision, lidar PoroTomo PoroTomo Nodal Seismometer Sweep Data arn:aws:s3:::nrel-pds-porotomo/Nodal/nodal_sac_sweep/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=Nodal%2Fnodal_sac_sweep%2F)'] -PoroTomo PoroTomo Nodal Seismometer Field Notes and Metadata arn:aws:s3:::nrel-pds-porotomo/Nodal/nodal_metadata/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=Nodal%2Fnodal_metadata%2F)'] -PoroTomo PoroTomo Vertical Distributed Acoustic Sensing (DASV) Data in SEG-Y format arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASV/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASV%2F)'] PoroTomo PoroTomo Datasets arn:aws:s3:::nrel-pds-porotomo/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo)'] -PoroTomo PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data in HDF5 format arn:aws:s3:::nrel-pds-porotomo/DAS/H5/DASH/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FH5%2FDASH%2F)'] +PoroTomo PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data in SEG-Y format arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASH/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASH%2F)'] PoroTomo PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data Resampled in Time M arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASH/Resampled/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASH%2FResampled%2F)'] +PoroTomo PoroTomo Vertical Distributed Acoustic Sensing (DASV) Data in SEG-Y format arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASV/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASV%2F)'] +PoroTomo PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data in HDF5 format arn:aws:s3:::nrel-pds-porotomo/DAS/H5/DASH/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FH5%2FDASH%2F)'] PoroTomo PoroTomo Vertical Distributed Acoustic Sensing (DASV) Data in HDF5 format arn:aws:s3:::nrel-pds-porotomo/DAS/H5/DASV/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FH5%2FDASV%2F)'] PoroTomo HSDS PoroTomo domains arn:aws:s3:::nrel-pds-hsds/nrel/porotomo/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-hsds&prefix=nrel%2Fporotomo%2F)'] -PoroTomo PoroTomo Horizontal Distributed Acoustic Sensing (DASH) Data in SEG-Y format arn:aws:s3:::nrel-pds-porotomo/DAS/SEG-Y/DASH/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=DAS%2FSEG-Y%2FDASH%2F)'] PoroTomo PoroTomo Nodal Seismometer Continuous Data arn:aws:s3:::nrel-pds-porotomo/Nodal/nodal_sac/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=Nodal%2Fnodal_sac%2F)'] +PoroTomo PoroTomo Nodal Seismometer Field Notes and Metadata arn:aws:s3:::nrel-pds-porotomo/Nodal/nodal_metadata/ us-west-2 S3 Bucket https://github.com/openEDI/documentation/blob/master/PoroTomo/PoroTomo.md Thomas Coleman (thomas.coleman@silixa.com) [National Renewable Energy Laboratory](https://www.nrel.gov/) As needed Creative Commons Attribution 3.0 United States License aws-pds, geothermal, seismology, image processing, geospatial ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-porotomo&prefix=Nodal%2Fnodal_metadata%2F)'] Poseidon 3D Seismic, Australia Poseidon 3D Seismic MDIO volumes and Reports arn:aws:s3:::tgs-opendata-poseidon us-west-2 S3 Bucket TBD For any questions regarding the datasets and MDIO, email the TGS Open Data Team [TGS](https://www.tgs.com) Dataset is static. CC BY 4.0 seismology, geophysics, exploration ['[Browse Bucket](https://tgs-opendata-poseidon.s3.amazonaws.com/index.html)'] Pre- and post-purchase product questions S3 bucket with dataset arn:aws:s3:::pre-post-purchase-questions us-east-1 S3 Bucket https://pre-post-purchase-questions.s3.amazonaws.com/README.txt litalku@amazon.com [Amazon](https://www.amazon.com/) Not currently being updated [Apache-2.0](https://www.apache.org/licenses/LICENSE-2.0) amazon.science, natural language processing, machine learning ['[PrePostQuestions.csv](https://pre-post-purchase-questions.s3.amazonaws.com/PrePostQuestions.csv)'] Prefeitura Municipal de São Paulo (PMSP) LiDAR Point Cloud São Paulo city's 3D LiDAR - Entwine Point Tiles arn:aws:s3:::ept-m3dc-pmsp sa-east-1 S3 Bucket https://github.com/geoinfo-smdu/M3DC geosampa@prefeitura.sp.gov.br [GeoSampa - o mapa digital da cidade de São Paulo](http://geosampa.prefeitura.sp Local survey executed by demand generates new data as local point clouds. [GNU General Public License v3.0](https://www.gnu.org/licenses/gpl-3.0.html) cities, land, lidar, urban, geospatial, elevation, mapping, aws-pds Prefeitura Municipal de São Paulo (PMSP) LiDAR Point Cloud São Paulo city's 3D LiDAR - LAZ Files arn:aws:s3:::laz-m3dc-pmsp sa-east-1 S3 Bucket https://github.com/geoinfo-smdu/M3DC geosampa@prefeitura.sp.gov.br [GeoSampa - o mapa digital da cidade de São Paulo](http://geosampa.prefeitura.sp Local survey executed by demand generates new data as local point clouds. [GNU General Public License v3.0](https://www.gnu.org/licenses/gpl-3.0.html) cities, land, lidar, urban, geospatial, elevation, mapping, aws-pds Product Comparison Dataset for Online Shopping Product Comparison Dataset for Online Shopping arn:aws:s3:::prod-comp-shopping-dataset us-west-2 S3 Bucket https://prod-comp-shopping-dataset.s3.us-west-2.amazonaws.com/README.md Post any questions to [re:Post](https://repost.aws/tags/questions/TApd0Wl5P8S9O6 [Amazon](https://www.amazon.com/) None [CC-BY-SA 4.0](https://creativecommons.org/licenses/by-sa/4.0/) product comparison, online shopping, amazon.science, natural language processing, machine learning ['[final_prodcomp_dataset_cleaned.tsv](https://prod-comp-shopping-dataset.s3.us-west-2.amazonaws.com/final_prodcomp_dataset_cleaned.tsv)'] -Protein Data Bank 3D Structural Biology Data Historical snapshots of archival datasets from 2005 onwards Snapshots are gener arn:aws:s3:::pdbsnapshots us-west-2 S3 Bucket https://www.wwpdb.org/documentation/file-format https://www.wwpdb.org/about/contact [Worldwide Protein Data Bank Partnership](wwpdb.org) New and updated data files are published weekly and released on Wednesdays 0:00 https://creativecommons.org/publicdomain/zero/1.0/ aws-pds, amino acid, archives, bioinformatics, biomolecular modeling, cell biology, chemical biology, COVID-19, electron microscopy, electron tomography, enzyme, life sciences, molecule, nuclear magnetic resonance, pharmaceutical, protein, protein template, SARS-CoV-2, structural biology, x-ray crystallography ['[Browse Bucket](https://pdbsnapshots.s3.us-west-2.amazonaws.com/index.html)'] Protein Data Bank 3D Structural Biology Data Globally cached distribution of the dataset Web frontend also available to brow us-west-2 CloudFront Distribution https://www.wwpdb.org/documentation/file-format https://www.wwpdb.org/about/contact [Worldwide Protein Data Bank Partnership](wwpdb.org) New and updated data files are published weekly and released on Wednesdays 0:00 https://creativecommons.org/publicdomain/zero/1.0/ aws-pds, amino acid, archives, bioinformatics, biomolecular modeling, cell biology, chemical biology, COVID-19, electron microscopy, electron tomography, enzyme, life sciences, molecule, nuclear magnetic resonance, pharmaceutical, protein, protein template, SARS-CoV-2, structural biology, x-ray crystallography ['[Browse Dataset](https://s3.rcsb.org)'] +Protein Data Bank 3D Structural Biology Data Historical snapshots of archival datasets from 2005 onwards Snapshots are gener arn:aws:s3:::pdbsnapshots us-west-2 S3 Bucket https://www.wwpdb.org/documentation/file-format https://www.wwpdb.org/about/contact [Worldwide Protein Data Bank Partnership](wwpdb.org) New and updated data files are published weekly and released on Wednesdays 0:00 https://creativecommons.org/publicdomain/zero/1.0/ aws-pds, amino acid, archives, bioinformatics, biomolecular modeling, cell biology, chemical biology, COVID-19, electron microscopy, electron tomography, enzyme, life sciences, molecule, nuclear magnetic resonance, pharmaceutical, protein, protein template, SARS-CoV-2, structural biology, x-ray crystallography ['[Browse Bucket](https://pdbsnapshots.s3.us-west-2.amazonaws.com/index.html)'] Provision of Web-Scale Parallel Corpora for Official European Languages (ParaCrawl) Parallel Corpora to/from English for all official EU languages arn:aws:s3:::web-language-models us-east-1 S3 Bucket https://paracrawl.eu/releases.html For questions regarding the datasets contact Kenneth Heafield, email kheafiel@in [ParaCrawl](https://paracrawl.eu) New data is added according to ParaCrawl release schedule. "Creative Commons CC0 license (""no rights reserved"")." aws-pds, machine translation, natural language processing -PubSeq - Public Sequence Resource Pubseq output data (Arvados Keep) arn:aws:s3:::pubseq-output-data us-east-2 S3 Bucket https://covid19.genenetwork.org/about https://covid19.genenetwork.org/contact [UTHSC GeneNetwork](https://covid19.genenetwork.org/) Rolling dataset. Creative Commons Attribution 4.0 International (CC BY 4.0) unless otherwise spec aws-pds, bam, bioinformatics, biology, coronavirus, COVID-19, fasta, fastq, fast5, genetic, genomic, health, json, life sciences, long read sequencing, open source software, MERS, metadata, medicine, RDF, SARS, SARS-CoV-2, SPARQL ['[Arvados download](https://covid19.genenetwork.org/download)'] PubSeq - Public Sequence Resource PubSeq submitted datasets (FASTA and JSON metadata) arn:aws:s3:::pubseq-datasets us-east-2 S3 Bucket https://covid19.genenetwork.org/about https://covid19.genenetwork.org/contact [UTHSC GeneNetwork](https://covid19.genenetwork.org/) Rolling dataset. Creative Commons Attribution 4.0 International (CC BY 4.0) unless otherwise spec aws-pds, bam, bioinformatics, biology, coronavirus, COVID-19, fasta, fastq, fast5, genetic, genomic, health, json, life sciences, long read sequencing, open source software, MERS, metadata, medicine, RDF, SARS, SARS-CoV-2, SPARQL ['[Browse Bucket](https://pubseq-datasets.s3.amazonaws.com/)'] +PubSeq - Public Sequence Resource Pubseq output data (Arvados Keep) arn:aws:s3:::pubseq-output-data us-east-2 S3 Bucket https://covid19.genenetwork.org/about https://covid19.genenetwork.org/contact [UTHSC GeneNetwork](https://covid19.genenetwork.org/) Rolling dataset. Creative Commons Attribution 4.0 International (CC BY 4.0) unless otherwise spec aws-pds, bam, bioinformatics, biology, coronavirus, COVID-19, fasta, fastq, fast5, genetic, genomic, health, json, life sciences, long read sequencing, open source software, MERS, metadata, medicine, RDF, SARS, SARS-CoV-2, SPARQL ['[Arvados download](https://covid19.genenetwork.org/download)'] Public Utility Data Liberation Project All PUDL data outputs arn:aws:s3:::pudl.catalyst.coop us-west-2 S3 Bucket You can download the [data directly](https://catalystcoop-pudl.readthedocs.io/en For general questions or feedback about the data, create an GitHub issue or disc [Catalyst Cooperative](https://catalyst.coop/) The federal agencies that publish the raw data PUDL processes release new data, The PUDL data and documentation are published under the [Creative Commons Attrib aws-pds, climate, climate model, energy, environmental, government records, infrastructure, open source software, electricity, energy modeling, utilities -PyEnvs and CallArgs CallArgs arn:aws:s3:::pyenvs-and-callargs/callargs/ us-west-2 S3 Bucket https://github.com/amazon-research/function-call-argument-completion Post any questions to [re:Post](https://repost.aws/tags/questions/TApd0Wl5P8S9O6 Amazon None Planned Please note that while we are providing this aggregation of code snippets unlice machine learning, code completion PyEnvs and CallArgs PyEnvs arn:aws:s3:::pyenvs-and-callargs/pyenvs/ us-west-2 S3 Bucket https://github.com/amazon-research/function-call-argument-completion Post any questions to [re:Post](https://repost.aws/tags/questions/TApd0Wl5P8S9O6 Amazon None Planned Please note that while we are providing this aggregation of code snippets unlice machine learning, code completion +PyEnvs and CallArgs CallArgs arn:aws:s3:::pyenvs-and-callargs/callargs/ us-west-2 S3 Bucket https://github.com/amazon-research/function-call-argument-completion Post any questions to [re:Post](https://repost.aws/tags/questions/TApd0Wl5P8S9O6 Amazon None Planned Please note that while we are providing this aggregation of code snippets unlice machine learning, code completion QIIME 2 Tutorial Data Source for rendered documentation and tutorial datasets for the QIIME 2 project arn:aws:s3:::qiime2-data us-west-2 S3 Bucket https://use.qiime2.org https://forum.qiime2.org Caporaso Lab Twice per year BSD 3-Clause License aws-pds, bioinformatics, biology, ecosystems, environmental, genetic, genomic, health, microbiome, metagenomics, life sciences Quoref Project data files in a public bucket arn:aws:s3:::ai2-public-datasets us-west-2 S3 Bucket https://allenai.org/data/quoref info@allenai.org [Allen Institute for AI](https://allenai.org) Not updated [CC BY](https://creativecommons.org/licenses/by/4.0) aws-pds, machine learning, natural language processing RACECAR Dataset The RACECAR dataset is the first open dataset for full-scale and high-speed auto arn:aws:s3:::racecar-dataset us-west-2 S3 Bucket https://github.com/linklab-uva/RACECAR_DATA Prof. Madhur Behl (madhur.behl@viginia.edu) Amar Kulkarni (ark8su@virginia.edu) This dataset was constructed during a single racing season (2021-22). Future sea Creative Commons Attribution-NonCommercial 4.0 International Public License [(CC aws-pds, autonomous vehicles, autonomous racing, robotics, computer vision, perception, lidar, radar, GNSS, image processing, localization, object detection, object tracking @@ -1026,10 +1026,10 @@ Reference data for HiFi human WGS HiFi Human WGS Reference data arn:aws:s3:::pac Refgenie reference genome assets Refgenie S3 Bucket arn:aws:s3:::awspds.refgenie.databio.org us-east-1 S3 Bucket http://refgenie.databio.org https://github.com/databio/refgenie/issues Sheffield lab at the University of Virginia As new data becomes available (roughly quarterly) Public domain aws-pds, biology, bioinformatics, genetic, genomic, infrastructure, life sciences, single-cell transcriptomics, transcriptomics, whole genome sequencing Registry of Open Data on AWS SNS topic for object create events arn:aws:sns:us-east-1:652627389412:roda-object_created us-east-1 SNS Topic https://github.com/awslabs/open-data-registry#how-are-datasets-added-to-the-regi opendata@amazon.com [Amazon Web Services](https://aws.amazon.com/) Automatically when new datasets are added [Apache-2.0](https://www.apache.org/licenses/LICENSE-2.0) amazon.science, json, metadata Registry of Open Data on AWS Registry of Open Data on AWS arn:aws:s3:::registry.opendata.aws/roda/ndjson/ us-east-1 S3 Bucket https://github.com/awslabs/open-data-registry#how-are-datasets-added-to-the-regi opendata@amazon.com [Amazon Web Services](https://aws.amazon.com/) Automatically when new datasets are added [Apache-2.0](https://www.apache.org/licenses/LICENSE-2.0) amazon.science, json, metadata +SILAM Air Quality Surface NetCDF files arn:aws:s3:::fmi-opendata-silam-surface-netcdf eu-west-1 S3 Bucket http://en.ilmatieteenlaitos.fi/open-data-on-aws-s3 avoin-data@fmi.fi [Finnish Meteorological Institute](https://www.ilmatieteenlaitos.fi/) 1 time a day Creative Commons Attribution 4.0 International (CC BY 4.0) aws-pds, earth observation, climate, weather, air quality, meteorological ['[Browse Bucket](https://fmi-opendata-silam-surface-netcdf.s3.amazonaws.com/index.html)'] SILAM Air Quality Surface Zarr files arn:aws:s3:::fmi-opendata-silam-surface-zarr eu-west-1 S3 Bucket http://en.ilmatieteenlaitos.fi/open-data-on-aws-s3 avoin-data@fmi.fi [Finnish Meteorological Institute](https://www.ilmatieteenlaitos.fi/) 1 time a day Creative Commons Attribution 4.0 International (CC BY 4.0) aws-pds, earth observation, climate, weather, air quality, meteorological ['[Browse Bucket](https://fmi-opendata-silam-surface-zarr.s3.amazonaws.com/index.html)'] -SILAM Air Quality Notifications for new zarr surface data arn:aws:sns:eu-west-1:916174725480:new-fmi-opendata-silam-surface-zarr eu-west-1 SNS Topic http://en.ilmatieteenlaitos.fi/open-data-on-aws-s3 avoin-data@fmi.fi [Finnish Meteorological Institute](https://www.ilmatieteenlaitos.fi/) 1 time a day Creative Commons Attribution 4.0 International (CC BY 4.0) aws-pds, earth observation, climate, weather, air quality, meteorological SILAM Air Quality Notifications for new netcdf surface data arn:aws:sns:eu-west-1:916174725480:new-fmi-opendata-silam-surface-netcdf eu-west-1 SNS Topic http://en.ilmatieteenlaitos.fi/open-data-on-aws-s3 avoin-data@fmi.fi [Finnish Meteorological Institute](https://www.ilmatieteenlaitos.fi/) 1 time a day Creative Commons Attribution 4.0 International (CC BY 4.0) aws-pds, earth observation, climate, weather, air quality, meteorological -SILAM Air Quality Surface NetCDF files arn:aws:s3:::fmi-opendata-silam-surface-netcdf eu-west-1 S3 Bucket http://en.ilmatieteenlaitos.fi/open-data-on-aws-s3 avoin-data@fmi.fi [Finnish Meteorological Institute](https://www.ilmatieteenlaitos.fi/) 1 time a day Creative Commons Attribution 4.0 International (CC BY 4.0) aws-pds, earth observation, climate, weather, air quality, meteorological ['[Browse Bucket](https://fmi-opendata-silam-surface-netcdf.s3.amazonaws.com/index.html)'] +SILAM Air Quality Notifications for new zarr surface data arn:aws:sns:eu-west-1:916174725480:new-fmi-opendata-silam-surface-zarr eu-west-1 SNS Topic http://en.ilmatieteenlaitos.fi/open-data-on-aws-s3 avoin-data@fmi.fi [Finnish Meteorological Institute](https://www.ilmatieteenlaitos.fi/) 1 time a day Creative Commons Attribution 4.0 International (CC BY 4.0) aws-pds, earth observation, climate, weather, air quality, meteorological SILO climate data on AWS SILO open data arn:aws:s3:::silo-open-data ap-southeast-2 S3 Bucket https://www.longpaddock.qld.gov.au/silo/gridded-data https://www.longpaddock.qld.gov.au/silo/contact-us Queensland Government Daily SILO datasets are constructed by the [Queensland Government](http://www.qld.gov. aws-pds, agriculture, climate, earth observation, environmental, meteorological, model, sustainability, water, weather SMN Hi-Res Weather Forecast over Argentina WRF SMN data arn:aws:s3:::smn-ar-wrf us-west-2 S3 Bucket General information, tutorials and examples:[https://odp-aws-smn.github.io/docum For any questions regarding the data set or any general questions, you can conta [SMN](http://www.smn.gov.ar/) New data is added as soon as it's available. Two forecast cycles a day initializ [Creative Commons Attribution 2.5 Argentina License](https://creativecommons.org aws-pds, earth observation, natural resource, weather, meteorological ['[Browse Bucket](https://smn-ar-wrf.s3.amazonaws.com/index.html)'] SPARTAN Data All data products (PM25, aerosol chemical components, scattering) provided by S arn:aws:s3:::spartan-cloud us-west-2 S3 Bucket https://www.spartan-network.org/data SPARTAN.PM25@gmail.com The [Atmospheric Composition Analysis Group](https://sites.wustl.edu/acag/) New measurement or estimation products will be added when available, usually mul SPARTAN data is licensed under [CC BY 4.0](https://creativecommons.org/licenses/ aws-pds, environmental, air quality @@ -1041,12 +1041,13 @@ Safecast New air and radiation measurement payloads arn:aws:sns:us-west-2:985752 Safecast Bulk exports of air and radiation measurements arn:aws:s3:::safecast-opendata-public-us-east-1 us-east-1 S3 Bucket https://github.com/Safecast/safecastapi/wiki/Data-Sets https://groups.google.com/forum/#!forum/safecast-devices [Safecast](https://safecast.org/) Continuous Safecast data is published under a [CC0 designation](https://creativecommons.org air quality, aws-pds, climate, environmental, geospatial, radiation ['[Browse Bucket](https://safecast-opendata-public-us-east-1.s3.amazonaws.com/index.html)'] SatPM2.5 Satellite-Derived Fine Particulate Matter (PM25) concentrations from the Atmosp arn:aws:s3:::v6.pm25.global us-west-2 S3 Bucket https://sites.wustl.edu/acag/datasets/surface-pm2-5/#V6.GL.02 randall.martin@wustl.edu https://sites.wustl.edu/acag/ Yearly Creative Commons Attribution 4.0 International (https://creativecommons.org/lice atmosphere, netcdf, environmental, air quality, health ['[Browse Bucket](https://s3.us-west-2.amazonaws.com/v6.pm25.global/index.html)'] Satellite - Sea surface temperature - Level 3 - Single sensor - 1 day - Day and night time Cloud Optimised AODN dataset of IMOS - SRS - SST - L3S - Single Sensor - 1 day - arn:aws:s3:::aodn-cloud-optimised/satellite_ghrsst_l3s_1day_daynighttime_single_sensor_australia.zarr ap-southeast-2 S3 Bucket https://catalogue-imos.aodn.org.au/geonetwork/srv/eng/catalog.search#/metadata/a info@aodn.org.au AODN As Needed http://creativecommons.org/licenses/by/4.0/ oceans, satellite imagery +Satellogic EarthView dataset Satellogic data includes TOA RGBN COG, VISUAL RGB COG files data and metadata arn:aws:s3:::satellogic-earthview us-west-2 S3 Bucket https://satellogic-earthview.s3.us-west-2.amazonaws.com/index.html https://www.satellogic.com/ [Satellogic](https://www.satellogic.com) New data will be made available periodically, with annual updates expected in th [CC BY 4.0](https://creativecommons.org/licenses/by/4.0/deed.en) aws-pds, satellite imagery, earth observation, image processing, geospatial, computer vision, stac, cog ['[STAC Catalog](https://satellogic-earthview.s3.us-west-2.amazonaws.com/stac/catalog.json)', '[STAC Browser](https://radiantearth.github.io/stac-browser/#/external/satellogic-earthview.s3.us-west-2.amazonaws.com/stac/catalog.json)'] False Scottish Public Sector LiDAR Dataset LiDAR data (DSM, DTM and Laz) arn:aws:s3:::srsp-open-data eu-west-2 S3 Bucket https://remotesensingdata.gov.scot/data#/list https://remotesensingdata.gov.scot/feedback or email Scottish Government on gi-s [Joint Nature Conservation Committee](https://jncc.gov.uk/) New datasets have historically been added every 2-3 years but there is no guaran All data is made available under the [Open Government Licence v3](http://www.nat lidar, cities, coastal, environmental, urban, elevation, cog, aws-pds Sea Around Us Global Fisheries Catch Data Global Fisheries Catch Data arn:aws:s3:::fisheries-catch-data us-west-2 S3 Bucket https://www.seaaroundus.org/ubc-cic-sea-around-us-project-collaboration/ https://www.seaaroundus.org/feedback/ [Sea Around Us](https://www.seaaroundus.org/) The full dataset is computed only once or twice a year or when there is a signif This data is available for anyone to use under the [Sea Around Us Terms of Use]( aws-pds, fisheries, ecosystems, biodiversity, marine Sea Surface Temperature Daily Analysis: European Space Agency Climate Change Initiative product version 2.1 Global daily-mean sea surface temperatures from 1981 onwards, in Zarr format Th arn:aws:s3:::surftemp-sst us-west-2 S3 Bucket https://surftemp.github.io/sst-data-tutorials/ https://www.reading.ac.uk/met/ [University of Reading, Department of Meteorology](https://www.reading.ac.uk/met yearly Creative Commons Licence by attribution (https://creativecommons.org/licenses/by aws-pds, earth observation, oceans, climate, environmental, global, geospatial -Seattle Alzheimer's Disease Brain Cell Atlas (SEA-AD) Spatial transcriptomics data files in a public bucket arn:aws:s3:::sea-ad-spatial-transcriptomics us-west-2 S3 Bucket https://portal.brain-map.org/explore/seattle-alzheimers-disease/seattle-alzheime awspublicdataset@alleninstitute.org [Allen Institute](http://www.alleninstitute.org/) Annually https://alleninstitute.org/legal/terms-use/ aws-pds, biology, cell biology, cell imaging, epigenomics, gene expression, histopathology, Homo sapiens, imaging, medicine, microscopy, neurobiology, neuroscience, single-cell transcriptomics, transcriptomics, life sciences ['[Browse Bucket](https://sea-ad-spatial-transcriptomics.s3.amazonaws.com/index.html)'] Seattle Alzheimer's Disease Brain Cell Atlas (SEA-AD) Quantitative neuropathology (full resolution images, processed images, and quant arn:aws:s3:::sea-ad-quantitative-neuropathology us-west-2 S3 Bucket https://portal.brain-map.org/explore/seattle-alzheimers-disease/seattle-alzheime awspublicdataset@alleninstitute.org [Allen Institute](http://www.alleninstitute.org/) Annually https://alleninstitute.org/legal/terms-use/ aws-pds, biology, cell biology, cell imaging, epigenomics, gene expression, histopathology, Homo sapiens, imaging, medicine, microscopy, neurobiology, neuroscience, single-cell transcriptomics, transcriptomics, life sciences ['[Browse Bucket](https://sea-ad-quantitative-neuropathology.s3.amazonaws.com/index.html)'] Seattle Alzheimer's Disease Brain Cell Atlas (SEA-AD) Single cell profiling (transcriptomics and epigenomics) data files in a public b arn:aws:s3:::sea-ad-single-cell-profiling us-west-2 S3 Bucket https://portal.brain-map.org/explore/seattle-alzheimers-disease/seattle-alzheime awspublicdataset@alleninstitute.org [Allen Institute](http://www.alleninstitute.org/) Annually https://alleninstitute.org/legal/terms-use/ aws-pds, biology, cell biology, cell imaging, epigenomics, gene expression, histopathology, Homo sapiens, imaging, medicine, microscopy, neurobiology, neuroscience, single-cell transcriptomics, transcriptomics, life sciences ['[Browse Bucket](https://sea-ad-single-cell-profiling.s3.amazonaws.com/index.html)'] +Seattle Alzheimer's Disease Brain Cell Atlas (SEA-AD) Spatial transcriptomics data files in a public bucket arn:aws:s3:::sea-ad-spatial-transcriptomics us-west-2 S3 Bucket https://portal.brain-map.org/explore/seattle-alzheimers-disease/seattle-alzheime awspublicdataset@alleninstitute.org [Allen Institute](http://www.alleninstitute.org/) Annually https://alleninstitute.org/legal/terms-use/ aws-pds, biology, cell biology, cell imaging, epigenomics, gene expression, histopathology, Homo sapiens, imaging, medicine, microscopy, neurobiology, neuroscience, single-cell transcriptomics, transcriptomics, life sciences ['[Browse Bucket](https://sea-ad-spatial-transcriptomics.s3.amazonaws.com/index.html)'] SeeFar V0 Primary SeeFar dataset containing multi-resolution satellite imagery in cloud-op arn:aws:s3:::seefar-dataset us-east-1 S3 Bucket https://coastalcarbon.ai/seefar James Lowman Coastal Carbon Yearly The SeeFar dataset includes multiple licensing terms, specific to each satellite geospatial, earth observation, satellite imagery, climate, biodiversity, coastal, machine learning, environmental, sustainability, natural resource, global, mapping, aws-pds Sentinel Near Real-time Canada Mirror | Miroir Sentinel temps quasi réel du Canada Sentinel data over Canada | Données sentinelles au Canada arn:aws:s3:::sentinel-products-ca-mirror ca-central-1 S3 Bucket https://sentinel.esa.int/web/sentinel/home eodms-sgdot@nrcan-rncan.gc.ca [Natural Resources Canada](https://www.nrcan.gc.ca/) Sentinel-1 is an NRT dataset retrieved from ESA within 90 minutes of satellite d The access and use of Copernicus Sentinel data is available on a free, full and aws-pds, agriculture, earth observation, satellite imagery, geospatial, sustainability, disaster response, synthetic aperture radar, stac ['[EODMS STAC for Sentinel products](https://www.eodms-sgdot.nrcan-rncan.gc.ca/stac/)'] Sentinel-1 S3 Inventory files for L1C and CSV arn:aws:s3:::sentinel-inventory/ eu-central-1 S3 Bucket https://roda.sentinel-hub.com/sentinel-s1-l1c/GRD/readme.html https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, disaster response, cog, synthetic aperture radar @@ -1056,23 +1057,23 @@ Sentinel-1 Precise Orbit Determination (POD) Products Sentinel-1 Orbits bucket a Sentinel-1 Precise Orbit Determination (POD) Products Notifications for new data arn:aws:sns:us-west-2:211125554030:s1-orbits-object_created us-west-2 SNS Topic https://s1-orbits.s3.us-west-2.amazonaws.com/README.html https://asf.alaska.edu/asf/contact-us/ [The Alaska Satellite Facility (ASF)](https://asf.alaska.edu/) Updated as new data becomes available on the [Copernicus Data Space Ecosystem](h Access to Sentinel data is free, full and open for the broad Regional, National, auxiliary data, disaster response, earth observation, earthquakes, floods, geophysics, sentinel-1, synthetic aperture radar Sentinel-1 SLC dataset for Germany Public access to Sentinel-1 SLC IW scenes over Germany arn:aws:s3:::sentinel1-slc eu-west-1 S3 Bucket https://github.com/live-eo/sentinel1-slc/ For any enquires regarding the dataset, please email OpenData at Live-EO opendat [LiveEO](https://live-eo.com/) New Sentinel1-SLC IW data are updated regularly in an interval of 6 days, after The data usage will inherit and fully comply with the free and open data policy aws-pds, disaster response, satellite imagery, geospatial, sustainability, earth observation, environmental, synthetic aperture radar Sentinel-1 SLC dataset for South and Southeast Asia, Taiwan, Korea and Japan Public access to Sentinel-1 SLC IW scenes over South and Southeast Asia, Taiwan arn:aws:s3:::sentinel1-slc-seasia-pds ap-southeast-1 S3 Bucket https://github.com/earthobservatory/sentinel1-opds/ For any enquires regarding data delivery, please email ehill@ntu.edu.sg and stch [Earth Observatory of Singapore, Nanyang Technological University](https://earth S1 SLC data for the region of interest will be updated regularly, as it becomes The data usage will inherit and fully comply with the free and open data policy aws-pds, disaster response, satellite imagery, geospatial, earth observation, environmental, synthetic aperture radar -Sentinel-2 New scene notifications for L2A, can subscribe with Lambda arn:aws:sns:eu-central-1:214830741341:SentinelS2L2A eu-central-1 SNS Topic Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac +Sentinel-2 S3 Inventory files for L1C and CSV arn:aws:s3:::sentinel-inventory/sentinel-s2-l1c eu-central-1 S3 Bucket Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac Sentinel-2 New scene notifications for L1C, can subscribe with Lambda arn:aws:sns:eu-west-1:214830741341:NewSentinel2Product eu-west-1 SNS Topic Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac -Sentinel-2 Zipped archives for each L2A product with 3 day retention period, in Requester P arn:aws:s3:::sentinel-s2-l2a-zips eu-central-1 S3 Bucket Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac True -Sentinel-2 Zipped archives for each L1C product with 3 day retention period, in Requester P arn:aws:s3:::sentinel-s2-l1c-zips eu-central-1 S3 Bucket Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac True Sentinel-2 S3 Inventory files for L2A and CSV arn:aws:s3:::sentinel-inventory/sentinel-s2-l2a eu-central-1 S3 Bucket Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac +Sentinel-2 Zipped archives for each L1C product with 3 day retention period, in Requester P arn:aws:s3:::sentinel-s2-l1c-zips eu-central-1 S3 Bucket Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac True +Sentinel-2 Zipped archives for each L2A product with 3 day retention period, in Requester P arn:aws:s3:::sentinel-s2-l2a-zips eu-central-1 S3 Bucket Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac True Sentinel-2 Level 2A scenes and metadata, in Requester Pays S3 bucket arn:aws:s3:::sentinel-s2-l2a eu-central-1 S3 Bucket Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac ['[STAC V1.0.0 endpoint](https://sentinel-s2-l2a-stac.s3.amazonaws.com/)'] True -Sentinel-2 S3 Inventory files for L1C and CSV arn:aws:s3:::sentinel-inventory/sentinel-s2-l1c eu-central-1 S3 Bucket Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac Sentinel-2 Level 1C scenes and metadata, in Requester Pays S3 bucket arn:aws:s3:::sentinel-s2-l1c eu-central-1 S3 Bucket Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac ['[Earth Search STAC L1C Collection](https://earth-search.aws.element84.com/v1/collections/sentinel-2-l1c)', '[Earth Search STAC Browser L1C Collection](https://radiantearth.github.io/stac-browser/#/external/earth-search.aws.element84.com/v1/collections/sentinel-2-l1c)', '[STAC V1.0.0 endpoint](https://sentinel-s2-l1c-stac.s3.amazonaws.com/)', '[Earth Viewer by Element 84](https://viewer.aws.element84.com/)'] True +Sentinel-2 New scene notifications for L2A, can subscribe with Lambda arn:aws:sns:eu-central-1:214830741341:SentinelS2L2A eu-central-1 SNS Topic Documentation is available for [Sentinel-2 L1C](https://roda.sentinel-hub.com/se https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, stac Sentinel-2 ACOLITE-DSF Aquatic Reflectance for the Conterminous United States New scene notification arn:aws:sns:us-west-2:242201296900:usgs-wma-sentinel-2-aqr-acolite-dsf-object_created us-west-2 SNS Topic https://www.sciencebase.gov/catalog/item/640f612dd34e254fd352e1ed tvking@usgs.gov [United States Geological Survey](https://www.usgs.gov) New scenes are added daily. Contains modified Copernicus Sentinel data, which is available under the Creativ aws-pds, earth observation, satellite imagery, geospatial, natural resource, cog, water Sentinel-2 ACOLITE-DSF Aquatic Reflectance for the Conterminous United States Scenes and metadata arn:aws:s3:::usgs-wma-sentinel-2-aqr-acolite-dsf/version_01 us-west-2 S3 Bucket https://www.sciencebase.gov/catalog/item/640f612dd34e254fd352e1ed tvking@usgs.gov [United States Geological Survey](https://www.usgs.gov) New scenes are added daily. Contains modified Copernicus Sentinel data, which is available under the Creativ aws-pds, earth observation, satellite imagery, geospatial, natural resource, cog, water Sentinel-2 Cloud-Optimized GeoTIFFs New scene notifications, can subscribe with Lambda arn:aws:sns:us-west-2:608149789419:cirrus-v0-publish us-west-2 SNS Topic https://github.com/cirrus-geo/cirrus-earth-search opendata@element84.com [Element 84](https://www.element84.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, cog, stac -Sentinel-2 Cloud-Optimized GeoTIFFs S3 Inventory files for L1C and CSV arn:aws:s3:::sentinel-cogs-inventory us-west-2 S3 Bucket https://github.com/cirrus-geo/cirrus-earth-search opendata@element84.com [Element 84](https://www.element84.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, cog, stac Sentinel-2 Cloud-Optimized GeoTIFFs Level 2A scenes and metadata arn:aws:s3:::sentinel-cogs us-west-2 S3 Bucket https://github.com/cirrus-geo/cirrus-earth-search opendata@element84.com [Element 84](https://www.element84.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, cog, stac ['[Earth Search STAC L2A Collection](https://earth-search.aws.element84.com/v1/collections/sentinel-2-l2a)', '[STAC Browser L2A Collection](https://radiantearth.github.io/stac-browser/#/external/earth-search.aws.element84.com/v1/collections/sentinel-2-l2a)'] False +Sentinel-2 Cloud-Optimized GeoTIFFs S3 Inventory files for L1C and CSV arn:aws:s3:::sentinel-cogs-inventory us-west-2 S3 Bucket https://github.com/cirrus-geo/cirrus-earth-search opendata@element84.com [Element 84](https://www.element84.com/) New Sentinel data are added regularly, usually within few hours after they are a Access to Sentinel data is free, full and open for the broad Regional, National, aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, disaster response, cog, stac Sentinel-2 L2A 120m Mosaic Sentinel-2 L2A 120m mosaics data in a S3 bucket arn:aws:s3:::sentinel-s2-l2a-mosaic-120 eu-central-1 S3 Bucket Documentation is available [here](https://sentinel-s2-l2a-mosaic-120.s3.amazonaw https://forum.sentinel-hub.com/c/aws-sentinel [Sinergise](https://www.sinergise.com/) New data will be added annually. CC-BY 4.0, Credit: Contains modified Copernicus data [year] processed by Sentine aws-pds, agriculture, earth observation, satellite imagery, geospatial, natural resource, machine learning, cog False -Sentinel-3 Sentinel-3 Near Real Time Data (NRT) format arn:aws:s3:::meeo-s3/NRT/ eu-central-1 S3 Bucket https://github.com/Sentinel-5P/data-on-s3/blob/master/DocsForAws/Sentinel3Descri sentinel3@meeo.it [Meteorological Environmental Earth Observation](http://www.meeo.it/) Daily https://sentinel.esa.int/documents/247904/690755/Sentinel_Data_Legal_Notice aws-pds, oceans, earth observation, environmental, geospatial, land, satellite imagery, cog, stac -Sentinel-3 Sentinel-3 Not Time Critical (NTC) format arn:aws:s3:::meeo-s3/NTC/ eu-central-1 S3 Bucket https://github.com/Sentinel-5P/data-on-s3/blob/master/DocsForAws/Sentinel3Descri sentinel3@meeo.it [Meteorological Environmental Earth Observation](http://www.meeo.it/) Daily https://sentinel.esa.int/documents/247904/690755/Sentinel_Data_Legal_Notice aws-pds, oceans, earth observation, environmental, geospatial, land, satellite imagery, cog, stac Sentinel-3 Sentinel-3 Short Time Critical (STC) format arn:aws:s3:::meeo-s3/STC/ eu-central-1 S3 Bucket https://github.com/Sentinel-5P/data-on-s3/blob/master/DocsForAws/Sentinel3Descri sentinel3@meeo.it [Meteorological Environmental Earth Observation](http://www.meeo.it/) Daily https://sentinel.esa.int/documents/247904/690755/Sentinel_Data_Legal_Notice aws-pds, oceans, earth observation, environmental, geospatial, land, satellite imagery, cog, stac +Sentinel-3 Sentinel-3 Not Time Critical (NTC) format arn:aws:s3:::meeo-s3/NTC/ eu-central-1 S3 Bucket https://github.com/Sentinel-5P/data-on-s3/blob/master/DocsForAws/Sentinel3Descri sentinel3@meeo.it [Meteorological Environmental Earth Observation](http://www.meeo.it/) Daily https://sentinel.esa.int/documents/247904/690755/Sentinel_Data_Legal_Notice aws-pds, oceans, earth observation, environmental, geospatial, land, satellite imagery, cog, stac +Sentinel-3 Sentinel-3 Near Real Time Data (NRT) format arn:aws:s3:::meeo-s3/NRT/ eu-central-1 S3 Bucket https://github.com/Sentinel-5P/data-on-s3/blob/master/DocsForAws/Sentinel3Descri sentinel3@meeo.it [Meteorological Environmental Earth Observation](http://www.meeo.it/) Daily https://sentinel.esa.int/documents/247904/690755/Sentinel_Data_Legal_Notice aws-pds, oceans, earth observation, environmental, geospatial, land, satellite imagery, cog, stac Sentinel-3 Sentinel-3 Cloud Optimized GeoTIFF (COG) format arn:aws:s3:::meeo-s3-cog/ eu-central-1 S3 Bucket https://github.com/Sentinel-5P/data-on-s3/blob/master/DocsForAws/Sentinel3Descri sentinel3@meeo.it [Meteorological Environmental Earth Observation](http://www.meeo.it/) Daily https://sentinel.esa.int/documents/247904/690755/Sentinel_Data_Legal_Notice aws-pds, oceans, earth observation, environmental, geospatial, land, satellite imagery, cog, stac ['[STAC V1.0.0 endpoint](https://meeo-s3.s3.amazonaws.com/)'] Sentinel-5P Level 2 Sentinel-5p Near Real Time Data (NRTI) NetCDF format arn:aws:s3:::meeo-s5p/NRTI/ eu-central-1 S3 Bucket https://github.com/Sentinel-5P/data-on-s3/blob/master/DocsForAws/Sentinel5P_Desc sentinel5p@meeo.it [Meteorological Environmental Earth Observation](http://www.meeo.it/) Daily https://sentinel.esa.int/documents/247904/690755/Sentinel_Data_Legal_Notice aws-pds, air quality, atmosphere, earth observation, environmental, geospatial, satellite imagery, cog, stac Sentinel-5P Level 2 Sentinel-5p Off Line Data (OFFL) NetCDF format arn:aws:s3:::meeo-s5p/OFFL/ eu-central-1 S3 Bucket https://github.com/Sentinel-5P/data-on-s3/blob/master/DocsForAws/Sentinel5P_Desc sentinel5p@meeo.it [Meteorological Environmental Earth Observation](http://www.meeo.it/) Daily https://sentinel.esa.int/documents/247904/690755/Sentinel_Data_Legal_Notice aws-pds, air quality, atmosphere, earth observation, environmental, geospatial, satellite imagery, cog, stac @@ -1090,8 +1091,8 @@ Single-Cell Atlas of Human Blood During Healthy Aging Raw sequencing data (fastq Smithsonian Open Access Smithsonian Open Access Media and Metadata arn:aws:s3:::smithsonian-open-access us-west-2 S3 Bucket http://edan.si.edu/openaccess/docs/ openaccess@si.edu [SI](http://www.si.edu/) New / updated metadata and image files will be pushed weekly. CC0 aws-pds, art, history, culture, museum, encyclopedic SocialGene RefSeq Databases SocialGene 2023_v041 Data and Database Dumps arn:aws:s3:::socialgene-open-data us-east-2 S3 Bucket https://socialgene.github.io/precomputed_databases/2023_v0.4.1/aws/aws https://github.com/socialgene/socialgene.github.io/issues University of Wisconsin-Madison This database is currently what was published in our 2024 paper introducing Soci Where applicable, SocialGene data is released under CC0 (https://creativecommons metagenomics, genomic, bioinformatics, microbiome, chemical biology, pharmaceutical, graph, protein, amino acid ['[Browse Bucket](https://socialgene-open-data.s3.amazonaws.com/)'] Sofar Spotter Archive Hourly position, wave spectra and bulk wave parameters from global free drifting arn:aws:s3:::sofar-spotter-archive us-west-2 S3 Bucket [Spotter Technical Reference Manual](https://content.sofarocean.com/hubfs/Spotte opendata@sofarocean.com [Sofar Ocean](https://www.sofarocean.com/company/contact-us) As available [Sofar Data Access Agreement](https://sofarocean.notion.site/sofarocean/Sofar-Da aws-pds, climate, meteorological, sustainability, weather, oceans, environmental, oceans ['[Browse Bucket](https://sofar-spotter-archive.s3.amazonaws.com/index.html)'] -Software Heritage Graph Dataset S3 Inventory files arn:aws:s3:::softwareheritage-inventory us-east-1 S3 Bucket https://docs.softwareheritage.org/devel/swh-dataset/graph/athena.html aws@softwareheritage.org Software Heritage Data is updated yearly Creative Commons Attribution 4.0 International.By accessing the dataset, you agr aws-pds, source code, open source software, free software, digital preservation Software Heritage Graph Dataset Software Heritage Graph Dataset arn:aws:s3:::softwareheritage us-east-1 S3 Bucket https://docs.softwareheritage.org/devel/swh-dataset/graph/athena.html aws@softwareheritage.org Software Heritage Data is updated yearly Creative Commons Attribution 4.0 International.By accessing the dataset, you agr aws-pds, source code, open source software, free software, digital preservation +Software Heritage Graph Dataset S3 Inventory files arn:aws:s3:::softwareheritage-inventory us-east-1 S3 Bucket https://docs.softwareheritage.org/devel/swh-dataset/graph/athena.html aws@softwareheritage.org Software Heritage Data is updated yearly Creative Commons Attribution 4.0 International.By accessing the dataset, you agr aws-pds, source code, open source software, free software, digital preservation Solar Dynamics Observatory (SDO) Machine Learning Dataset The v1 dataset includes AIA observations 2010-2018 and v2 includes AIA observati arn:aws:s3:::gov-nasa-hdrl-data1/contrib/fdl-sdoml/ us-west-2 S3 Bucket https://github.com/SDOML/sdoml.github.io Meng Jin (jinmeng@lmsal.com) and Paul Wright (paul@pauljwright.co.uk) [NASA](http://www.nasa.gov/) N/A (The IDL/Python scripts for generating the datasets are published online, wh There are no restrictions on the use of this data. aws-pds, machine learning, NASA SMD AI SondeHub Radiosonde Telemetry Radiosonde Telemetry as JSON blobs of Universal Telemetry format arn:aws:s3:::sondehub-history us-east-1 S3 Bucket https://github.com/projecthorus/sondehub-infra/wiki/Amazon-Open-Data Michaela Wheeler [SondeHub](https://sondehub.org/) Data is updated as we receive it Creative Commons BY-SA 2.0 aws-pds, climate, environmental, weather, GPS ['[Browse Bucket by serial number](http://sondehub-history.s3-website-us-east-1.amazonaws.com/#serial/)', '[Browse Bucket by date/time](http://sondehub-history.s3-website-us-east-1.amazonaws.com/#date/)'] Sophos/ReversingLabs 20 Million malware detection dataset Sophos/ReversingLabs 20 million sample dataset arn:aws:s3:::sorel-20m/ us-west-2 S3 Bucket https://github.com/sophos-ai/SOREL-20M/blob/master/README.md sorel-dataset@sophos.com Sophos AI At most annually See the [Terms of Use](https://github.com/sophos-ai/SOREL-20M/blob/master/Terms% aws-pds, cyber security, deep learning, labeled, machine learning @@ -1105,8 +1106,8 @@ Storm EVent ImageRy (SEVIR) Dataset of storm imagery arn:aws:s3:::sevir us-west- Sub-Meter Canopy Tree Height of California in 2020 by CTrees.org Cloud-optimized GeoTIFF files with names corresponding to image of California fo arn:aws:s3:::ctrees-tree-height-ca-2020/ us-west-2 S3 Bucket [Project overview](https://ctrees.org/products/tree-level) info@ctrees.org [CTrees](https://ctrees.org/) TBD https://creativecommons.org/licenses/by/4.0/ aws-pds, cog, earth observation, land cover, deep learning, aerial imagery, image processing, environmental, conservation, geospatial Sudachi Language Resources SudachiDict: Binary format of the mophological analysis dictionarieschiVe: Pret arn:aws:s3:::sudachi ap-northeast-1 S3 Bucket https://worksapplications.github.io/Sudachi/ sudachi@worksap.co.jp [Works Applications](https://www.worksap.co.jp/about/csr/nlp/) The dictionaries are updated every few months to include neologism and fixes for Apache-2.0 aws-pds, natural language processing Sudachi Language Resources Cloudfront CDN mirror ap-northeast-1 CloudFront Distribution https://worksapplications.github.io/Sudachi/ sudachi@worksap.co.jp [Works Applications](https://www.worksap.co.jp/about/csr/nlp/) The dictionaries are updated every few months to include neologism and fixes for Apache-2.0 aws-pds, natural language processing d2ej7fkh96fzlu.cloudfront.net -Sup3rCC Sup3rCC Generative Models arn:aws:s3:::nrel-pds-sup3rcc/models/ us-west-2 S3 Bucket https://github.com/NREL/sup3r Grant Buster (grant.buster@nrel.gov) [National Renewable Energy Laboratory](https://www.nrel.gov/) Annual Creative Commons Attribution 4.0 United States License aws-pds, energy, solar, air temperature, climate model ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-sup3rcc&prefix=models%2F)'] Sup3rCC Sup3rCC - CONUS - MRI ESM 20 - SSP585 - r1i1p1f1 arn:aws:s3:::nrel-pds-sup3rcc/conus_mriesm20_ssp585_r1i1p1f1/ us-west-2 S3 Bucket https://github.com/NREL/sup3r Grant Buster (grant.buster@nrel.gov) [National Renewable Energy Laboratory](https://www.nrel.gov/) Annual Creative Commons Attribution 4.0 United States License aws-pds, energy, solar, air temperature, climate model ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-sup3rcc&prefix=conus_mriesm20_ssp585_r1i1p1f1%2F)'] +Sup3rCC Sup3rCC Generative Models arn:aws:s3:::nrel-pds-sup3rcc/models/ us-west-2 S3 Bucket https://github.com/NREL/sup3r Grant Buster (grant.buster@nrel.gov) [National Renewable Energy Laboratory](https://www.nrel.gov/) Annual Creative Commons Attribution 4.0 United States License aws-pds, energy, solar, air temperature, climate model ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-sup3rcc&prefix=models%2F)'] Sup3rCC Sup3rCC arn:aws:s3:::nrel-pds-sup3rcc/ us-west-2 S3 Bucket https://github.com/NREL/sup3r Grant Buster (grant.buster@nrel.gov) [National Renewable Energy Laboratory](https://www.nrel.gov/) Annual Creative Commons Attribution 4.0 United States License aws-pds, energy, solar, air temperature, climate model ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-sup3rcc)'] Swiss Public Transport Stops data files ESRI FGDB, CSV , MapInfo, Interlis arn:aws:s3:::data.geo.admin.ch/ch.bav.haltestellen-oev/data.zip eu-west-1 S3 Bucket https://www.bav.admin.ch/bav/de/home/allgemeine-themen/fachthemen/geoinformation fredi.daellenbach@bav.admin.ch Swiss Geoportal annually You may use this dataset for non-commercial purposes. You may use this dataset f aws-pds, cities, geospatial, infrastructure, mapping, traffic, transportation ['[Browse Bucket](https://data.geo.admin.ch/index.html)'] Synthea Coherent Data Set Synthetic data set that includes FHIR resources, DICOM images, genomic data, phy arn:aws:s3:::synthea-open-data/coherent/ us-east-1 S3 Bucket https://doi.org/10.3390/electronics11081199 synthea-list@groups.mitre.org [The MITRE Corporation](https://www.mitre.org) Rarely [Creative Commons Attribution 4.0 International License](https://creativecommons aws-pds, health, bioinformatics, life sciences, medicine, csv, dicom, genomic, imaging @@ -1134,8 +1135,8 @@ The Singapore Nanopore Expression Data Set Nanopore long read RNA Seq data from The University of California San Francisco Brain Metastases Stereotactic Radiosurgery (UCSF-BMSR) MRI Dataset Zip archive containing NifTI files arn:aws:s3:::ucsf-dmi/UCSF_BrainMetastases_v1.zip us-west-1 S3 Bucket https://imagingdatasets.ucsf.edu/dataset/1 dmi-support@ucsf.edu [UCSF Center for Intelligent Imaging](https://intelligentimaging.ucsf.edu/) ad hoc Custom, non-commerical, attribution, no redistribution, no re-identification. F aws-pds, cancer, life sciences, magnetic resonance imaging, medicine, medical imaging, radiology https://imagingdatasets.ucsf.edu/dataset/1 Therapeutically Applicable Research to Generate Effective Treatments (TARGET) Clinical Supplement, Biospecimen Supplement, RNA-Seq Gene Expression Quantificat arn:aws:s3:::gdc-target-phs000218-2-open us-east-1 S3 Bucket https://ocg.cancer.gov/programs/target/ dcf-support@datacommons.io [Center for Translational Data Science at The University of Chicago](https://ctd Genomic Data Commons (GDC) is source of truth for this dataset; GDC offers month NIH Genomic Data Sharing Policy: https://gdc.cancer.gov/access-data/data-access- aws-pds, cancer, genomic, life sciences, whole genome sequencing, STRIDES Toxicant Exposures and Responses by Genomic and Epigenomic Regulators of Transcription (TaRGET) Released and archived TaRGET II data arn:aws:s3:::targetepigenomics us-west-2 S3 Bucket https://data.targetepigenomics.org/ targetdcc16@gmail.com TaRGET II Data Coordination Center (TaRGET-DCC) TaRGET-DCC offers monthly data releases, although this dataset may not be update External data users may freely download, analyze, and publish results based on a biology, bioinformatics, genetic, genomic, life sciences, environmental, epigenomics, aws-pds -Transiting Exoplanet Survey Satellite (TESS) TESS Mission data files arn:aws:s3:::stpubdata/tess us-east-1 S3 Bucket https://archive.stsci.edu/missions-and-data/tess archive@stsci.edu [Space Telescope Science Institute](http://www.stsci.edu/) Monthly Public domain. Attribution required for refereed scientific papers. astronomy, aws-pds False Transiting Exoplanet Survey Satellite (TESS) Notifications for new data arn:aws:sns:us-east-1:879230861493:stpubdata/tess us-east-1 SNS Topic https://archive.stsci.edu/missions-and-data/tess archive@stsci.edu [Space Telescope Science Institute](http://www.stsci.edu/) Monthly Public domain. Attribution required for refereed scientific papers. astronomy, aws-pds +Transiting Exoplanet Survey Satellite (TESS) TESS Mission data files arn:aws:s3:::stpubdata/tess us-east-1 S3 Bucket https://archive.stsci.edu/missions-and-data/tess archive@stsci.edu [Space Telescope Science Institute](http://www.stsci.edu/) Monthly Public domain. Attribution required for refereed scientific papers. astronomy, aws-pds False Tropical Cyclone Precipitation, Infrared, Microwave, and Environmental Dataset (TC PRIMED) The Tropical Cyclone Precipitation, Infrared, Microwave and Environmental Datase arn:aws:s3:::noaa-nesdis-tcprimed-pds us-east-1 S3 Bucket https://rammb-data.cira.colostate.edu/tcprimed/TCPRIMED_v01r00_documentation.pdf CIRA_tcprimed [at] colostate [dot] edu [CIRA](https://www.cira.colostate.edu/) Annually, several months after the conclusion of the Northern Hemisphere tropica No constraints on data access or use atmosphere, aws-pds, earth observation, environmental, geophysics, geoscience, global, meteorological, model, netcdf, precipitation, satellite imagery, weather ['[Browse Bucket](https://noaa-nesdis-tcprimed-pds.s3.amazonaws.com/index.html)'] U.S. Census ACS PUMS PUMS data in Turtle - Terse RDF Triple Language (ttl) format along with ontolog arn:aws:s3:::dataworld-linked-acs us-east-1 S3 Bucket https://docs.data.world/uscensus/#american-community-survey-linked-open-data https://docs.data.world/uscensus/#60---contact Data.world Yearly, after ACS 1-year PUMS raw data are released [Creative Commons Attribution 4.0 International (CC BY 4.0)](https://creativecom aws-pds, statistics, census, survey UCSC Genome Browser Sequence and Annotations https://genomeucscedu/FAQ/FAQformathtml arn:aws:s3:::genome-browser us-east-1 S3 Bucket https://hgdownload.soe.ucsc.edu/downloads.html https://genome.ucsc.edu/contacts.html University of California Santa Cruz Genome Institute Monthly [Public domain, some tracks require attribution](https://genome.ucsc.edu/license aws-pds, genetic, genomic, life sciences, bioinformatics, biology @@ -1152,30 +1153,30 @@ USGS Landsat Scenes and metadata arn:aws:s3:::usgs-landsat/collection02/ us-west USearch Molecules Project data files in a public bucket arn:aws:s3:::usearch-molecules us-west-2 S3 Bucket https://github.com/ashvardanian/usearch-molecules ash.vardanian@unum.cloud [Ash Vardanian](https://ashvardanian.com) Not updated [Apache 2.0](https://www.apache.org/licenses/LICENSE-2.0) aws-pds, life sciences, biology, chemical biology, pharmaceutical Umbra Synthetic Aperture Radar (SAR) Open Data Umbra Spotlight collects including GEC, SICD, SIDD, CPHD data and metadata arn:aws:s3:::umbra-open-data-catalog us-west-2 S3 Bucket https://help.umbra.space/product-guide help@umbra.space [Umbra](http://umbra.space/) New data is added frequently. The frequent updates enable users to analyze the t All data is provided with a Creative Commons License ([CC by 4.0](https://umbra. aws-pds, synthetic aperture radar, stac, satellite imagery, earth observation, image processing, geospatial ['[Browse Bucket](http://umbra-open-data-catalog.s3-website.us-west-2.amazonaws.com/)', '[STAC Browser](https://radiantearth.github.io/stac-browser/#/external/s3.us-west-2.amazonaws.com/umbra-open-data-catalog/stac/catalog.json)'] False Unblurred Coadds of the Wide-field Infrared Survey Explorer (unWISE) The unWISE Time-Domain Catalog is based on 'time-resolved' coadds, each of which arn:aws:s3:::nasa-irsa-wise/unwise/ us-west-2 S3 Bucket https://irsa.ipac.caltech.edu/data/WISE/unWISE/overview.html https://irsa.ipac.caltech.edu/docs/help_desk.html NASA/IPAC Infrared Science Archive ([IRSA](https://irsa.ipac.caltech.edu)) at Ca The unWISE dataset is updated periodically to include new data released by NEOWI https://irsa.ipac.caltech.edu/data_use_terms.html aws-pds, astronomy, object detection, parquet, survey False False -UniProt UniProt 2024_02 arn:aws:s3:::aws-open-data-uniprot-rdf/2024-02/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL -UniProt UniProt 2024_03 arn:aws:s3:::aws-open-data-uniprot-rdf/2024-03/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL -UniProt UniProt 2024_05 arn:aws:s3:::aws-open-data-uniprot-rdf/2024-05/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2021_03 arn:aws:s3:::aws-open-data-uniprot-rdf/2021-03/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL UniProt UniProt 2021_01 arn:aws:s3:::aws-open-data-uniprot-rdf/2021-01/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL UniProt UniProt 2021_02 arn:aws:s3:::aws-open-data-uniprot-rdf/2021-02/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL -UniProt UniProt 2021_03 arn:aws:s3:::aws-open-data-uniprot-rdf/2021-03/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL UniProt UniProt 2021_04 arn:aws:s3:::aws-open-data-uniprot-rdf/2021-04/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL -UniProt UniProt 2022_01 arn:aws:s3:::aws-open-data-uniprot-rdf/2022-01/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2022_02 arn:aws:s3:::aws-open-data-uniprot-rdf/2022-02/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL UniProt UniProt 2022_03 arn:aws:s3:::aws-open-data-uniprot-rdf/2022-03/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL -UniProt UniProt 2023_05 arn:aws:s3:::aws-open-data-uniprot-rdf/2023-05/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL -UniProt UniProt 2022_04 arn:aws:s3:::aws-open-data-uniprot-rdf/2022-04/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2022_01 arn:aws:s3:::aws-open-data-uniprot-rdf/2022-01/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL UniProt UniProt 2022_05 arn:aws:s3:::aws-open-data-uniprot-rdf/2022-05/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL -UniProt UniProt 2023_01 arn:aws:s3:::aws-open-data-uniprot-rdf/2023-01/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL -UniProt UniProt 2023_02 arn:aws:s3:::aws-open-data-uniprot-rdf/2023-02/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2024_05 arn:aws:s3:::aws-open-data-uniprot-rdf/2024-05/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2024_03 arn:aws:s3:::aws-open-data-uniprot-rdf/2024-03/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2024_02 arn:aws:s3:::aws-open-data-uniprot-rdf/2024-02/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2022_04 arn:aws:s3:::aws-open-data-uniprot-rdf/2022-04/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2023_05 arn:aws:s3:::aws-open-data-uniprot-rdf/2023-05/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2024_01 arn:aws:s3:::aws-open-data-uniprot-rdf/2024-01/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL UniProt UniProt 2023_03 arn:aws:s3:::aws-open-data-uniprot-rdf/2023-03/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2023_02 arn:aws:s3:::aws-open-data-uniprot-rdf/2023-02/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL +UniProt UniProt 2023_01 arn:aws:s3:::aws-open-data-uniprot-rdf/2023-01/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL UniProt UniProt 2023_04 arn:aws:s3:::aws-open-data-uniprot-rdf/2023-04/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL -UniProt UniProt 2022_02 arn:aws:s3:::aws-open-data-uniprot-rdf/2022-02/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL -UniProt UniProt 2024_01 arn:aws:s3:::aws-open-data-uniprot-rdf/2024-01/ eu-west-3 S3 Bucket https://www.uniprot.org/help/about https://www.uniprot.org/contact [SIB Swiss Institute of Bioinformatics](https://sp.sib.swiss/) on behalf of the Under 1 months after a new UniProt release. http://creativecommons.org/licenses/by/4.0/ aws-pds, chemistry, protein, enzyme, molecule, life sciences, bioinformatics, biology, RDF, graph, SPARQL University of British Columbia Sunflower Genome Dataset UBC Sunflower Genome Data 1 arn:aws:s3:::ubc-sunflower-genome us-west-2 S3 Bucket https://rieseberglab.github.io/ubc-sunflower-genome/ UBC Botany Sunflower The Rieseberg Lab at the University of British Columbia Twice per year. Public Domain aws-pds, agriculture, biodiversity, bioinformatics, biology, food security, genetic, genomic, life sciences, whole genome sequencing VENUS L2A Cloud-Optimized GeoTIFFs New Venus L2A dataset notifications, can subscribe with Lambda arn:aws:sns:us-east-1:794383284256:venus-l2a-cogs-object_created us-east-1 SNS Topic https://github.com/earthdaily/venus-on-aws/ Klaus Bachhuber - klaus.bachhuber@earthdaily.com [EarthDaily Analytics](https://earthdaily.com/) New Venus data are added regularly https://creativecommons.org/licenses/by-nc/4.0/ aws-pds, agriculture, earth observation, satellite imagery, geospatial, image processing, natural resource, disaster response, cog, stac, activity detection, environmental, land cover VENUS L2A Cloud-Optimized GeoTIFFs Venus L2A dataset (COG) and metadata (STAC) arn:aws:s3:::venus-l2a-cogs us-east-1 S3 Bucket https://github.com/earthdaily/venus-on-aws/ Klaus Bachhuber - klaus.bachhuber@earthdaily.com [EarthDaily Analytics](https://earthdaily.com/) New Venus data are added regularly https://creativecommons.org/licenses/by-nc/4.0/ aws-pds, agriculture, earth observation, satellite imagery, geospatial, image processing, natural resource, disaster response, cog, stac, activity detection, environmental, land cover ['[STAC Browser Venus L2A (COG) Catalog](https://radiantearth.github.io/stac-browser/#/external/venus-l2a-cogs.s3.us-east-1.amazonaws.com/catalog.json)'] False Variant Effect Predictor (VEP) and the Loss-Of-Function Transcript Effect Estimator (LOFTEE) Plugin VEP and LOFTEE data arn:aws:s3:::hail-vep-pipeline us-east-1 S3 Bucket https://hail-vep-pipeline.public.tennex.io/ https://www.tennex.io/contact [Tennex](https://www.tennex.io/) New packages are added as soon as they are available and confirmed to work with [VEP](https://uswest.ensembl.org/info/about/publications.html) use is governed b aws-pds, genome wide association study, genomic, life sciences, vep, loftee -Vermont Open Geospatial on AWS Imagery datsets are organized in this bucket as statewide file mosaics and by ac arn:aws:s3:::vtopendata-prd/Imagery us-east-2 S3 Bucket https://vcgi.vermont.gov/data-and-programs/ If you have specific questions please contact - vcgi@vermont.gov [Vermont Center for Geographic Information](https://vcgi.vermont.gov) Vermont acquires statewide imagery approximately once every other year. Lidar is Public Domain with Attribution earth observation, aerial imagery, geospatial, lidar, elevation, land cover False Vermont Open Geospatial on AWS Landcover datsets are organized in this bucket as statewide file mosaics These arn:aws:s3:::vtopendata-prd/Landcover us-east-2 S3 Bucket https://vcgi.vermont.gov/data-and-programs/ If you have specific questions please contact - vcgi@vermont.gov [Vermont Center for Geographic Information](https://vcgi.vermont.gov) Vermont acquires statewide imagery approximately once every other year. Lidar is Public Domain with Attribution earth observation, aerial imagery, geospatial, lidar, elevation, land cover False +Vermont Open Geospatial on AWS Imagery datsets are organized in this bucket as statewide file mosaics and by ac arn:aws:s3:::vtopendata-prd/Imagery us-east-2 S3 Bucket https://vcgi.vermont.gov/data-and-programs/ If you have specific questions please contact - vcgi@vermont.gov [Vermont Center for Geographic Information](https://vcgi.vermont.gov) Vermont acquires statewide imagery approximately once every other year. Lidar is Public Domain with Attribution earth observation, aerial imagery, geospatial, lidar, elevation, land cover False Vermont Open Geospatial on AWS Elevation datsets (primarily lidar based) are organized in this bucket as statew arn:aws:s3:::vtopendata-prd/Elevation us-east-2 S3 Bucket https://vcgi.vermont.gov/data-and-programs/ If you have specific questions please contact - vcgi@vermont.gov [Vermont Center for Geographic Information](https://vcgi.vermont.gov) Vermont acquires statewide imagery approximately once every other year. Lidar is Public Domain with Attribution earth observation, aerial imagery, geospatial, lidar, elevation, land cover False Virginia Coastal Resilience Master Plan, Phase 1 - December 2021 Data Product List See readmetxt file for more information on the folder struc arn:aws:s3:::vadcr-frp us-east-1 S3 Bucket https://www.dcr.virginia.gov/crmp/ flood.resilience@dcr.virginia.gov [Virginia Department of Conservation and Recreation](https://www.dcr.virginia.go Every 5 years or as data becomes available Conditions of Release - Data is available by permission of the Virginia Departme aws-pds, coastal, floods ['[Browse Data](https://vadcr-frp.s3.us-east-1.amazonaws.com/index.html)'] Virtual Shizuoka, 3D Point Cloud Data Point Cloud Data of Shizuoka Prefecture, Japan arn:aws:s3:::virtual-shizuoka ap-northeast-1 S3 Bucket https://github.com/aigidjp/opendata_virtualshizuoka/README.md virtualshizuoka@aigid.jp [AIGID](https://aigid.jp/) Currently not scheduled Creative Commons Attribution 4.0 International (CC-BY 4.0) and Open Data Commons aws-pds, bathymetry, disaster response, elevation, geospatial, japanese, land, lidar, mapping @@ -1189,31 +1190,31 @@ Whiffle WINS50 Open Data on AWS Whiffle WINS50 LES Data arn:aws:s3:::whiffle-win WikiSum: Coherent Summarization Dataset for Efficient Human-Evaluation WikiSum Dataset arn:aws:s3:::wikisum us-east-1 S3 Bucket https://wikisum.s3.amazonaws.com/README.txt nachshon@amazon.com, orenk@amazon.com [Amazon](https://www.amazon.com/) Not currently being updated Dataset is published under [CC-NC-SA-3.0](https://creativecommons.org/licenses/b amazon.science, natural language processing, machine learning ['[wikisum.zip](https://wikisum.s3.amazonaws.com/WikiSumDataset.zip)', '[wikisum-human-eval.zip](https://wikisum.s3.amazonaws.com/HumanEvaluation.zip)'] Will Two Do? Varying Dimensions in Electrocardiography: The PhysioNet/Computing in Cardiology Challenge 2021 https://doiorg/1013026/34va-7q14 arn:aws:s3:::physionet-open/challenge-2021/ us-east-1 S3 Bucket https://doi.org/10.13026/34va-7q14 https://physionet.org/about/#contact_us [PhysioNet](https://physionet.org/) Not updated Creative Commons Attribution 4.0 International Public License aws-pds Wind AI Bench Wind AI Bench Flow Redirection and Induction in Steady State (FLORIS) Wind Plant arn:aws:s3:::nrel-pds-windai/wind_plant_power/floris/ us-west-2 S3 Bucket https://github.com/NREL/windAI_bench Ryan King (ryan.king@nrel.gov) [National Renewable Energy Laboratory](https://www.nrel.gov/) Annually Creative Commons Attribution 4.0 United States License aws-pds, energy, benchmark, machine learning ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-windai&prefix=wind_plant_power%2Ffloris%2F)'] -Wind AI Bench Wind AI Bench Airfoil Computational Fluid Dynamics (CFD) - 9k Shapes Data Sets arn:aws:s3:::nrel-pds-windai/aerodynamic_shapes/2D/9K_airfoils/ us-west-2 S3 Bucket https://github.com/NREL/windAI_bench Ryan King (ryan.king@nrel.gov) [National Renewable Energy Laboratory](https://www.nrel.gov/) Annually Creative Commons Attribution 4.0 United States License aws-pds, energy, benchmark, machine learning ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-windai&prefix=aerodynamic_shapes%2F2D%2F9k_airfoils%2F)'] Wind AI Bench Wind AI Bench Airfoil Computational Fluid Dynamics (CFD) - 2k Shapes Data Sets arn:aws:s3:::nrel-pds-windai/aerodynamic_shapes/2D/2K_airfoils/ us-west-2 S3 Bucket https://github.com/NREL/windAI_bench Ryan King (ryan.king@nrel.gov) [National Renewable Energy Laboratory](https://www.nrel.gov/) Annually Creative Commons Attribution 4.0 United States License aws-pds, energy, benchmark, machine learning ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-windai&prefix=aerodynamic_shapes%2F2D%2F2k_airfoils%2F)'] +Wind AI Bench Wind AI Bench Airfoil Computational Fluid Dynamics (CFD) - 9k Shapes Data Sets arn:aws:s3:::nrel-pds-windai/aerodynamic_shapes/2D/9K_airfoils/ us-west-2 S3 Bucket https://github.com/NREL/windAI_bench Ryan King (ryan.king@nrel.gov) [National Renewable Energy Laboratory](https://www.nrel.gov/) Annually Creative Commons Attribution 4.0 United States License aws-pds, energy, benchmark, machine learning ['[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-windai&prefix=aerodynamic_shapes%2F2D%2F9k_airfoils%2F)'] Wizard of Tasks Wizard of Tasks Dataset arn:aws:s3:::wizard-of-tasks us-west-2 S3 Bucket https://wizard-of-tasks.s3.us-west-2.amazonaws.com/README.md giusecas@amazon.com [Amazon](https://www.amazon.com/) Not currently being updated [cc-by-sa 4.0](https://creativecommons.org/licenses/by-sa/4.0/) conversation data, dialog, amazon.science, natural language processing, machine learning ['[wizard_of_tasks_cooking_v1.0.json](https://wizard-of-tasks.s3.us-west-2.amazonaws.com/wizard_of_tasks_cooking_v1.0.json)', '[wizard_of_tasks_diy_v1.0.json](https://wizard-of-tasks.s3.us-west-2.amazonaws.com/wizard_of_tasks_diy_v1.0.json)'] World Bank - Light Every Night Light Every Night dataset of all VIIRS DNB and DMSP-OLS nighttime satellite data arn:aws:s3:::globalnightlight us-east-1 S3 Bucket https://worldbank.github.io/OpenNightLights/wb-light-every-night-readme.html Trevor Monroe tmonroe@worldbank.org; Benjamin P. Stewart bstewart@worldbankgroup [World Bank Group](https://www.worldbank.org/en/home) Quarterly [World Bank Open Database License (ODbL)](https://creativecommons.org/licenses/b disaster response, earth observation, satellite imagery, aws-pds, stac, cog ['[STAC 1.0.0-beta.2 endpoint](https://stacindex.org/catalogs/world-bank-light-every-night#/)'] World Bank Climate Change Knowledge Portal (CCKP) World Bank Climate Change Knowledge Portal observed and projected climate datase arn:aws:s3:::wbg-cckp us-west-2 S3 Bucket https://worldbank.github.io/climateknowledgeportal C. MacKenzie Dove cdove@worldbank.org; askclimate@worldbank.org [World Bank Group](https://www.worldbank.org/en/home) Semi-annually [World Bank Open Database License (ODbL)](https://creativecommons.org/licenses/b aws-pds, climate, climate model, earth observation, climate projections, CMIP6, netcdf Xiph.Org Test Media Video and imagery data arn:aws:s3:::xiph-media us-east-1 S3 Bucket https://media.xiph.org/aws.html Thomas Daede tdaede@xiph.org [Xiph.org](https://xiph.org/) New videos are added when contributors submit them. Various. Most are under the CC-BY license. License text accompanies each sequenc aws-pds, computer vision, image processing, imaging, media, movies, multimedia, video Yale-CMU-Berkeley (YCB) Object and Model Set Project data files arn:aws:s3:::ycb-benchmarks us-east-1 S3 Bucket http://www.ycbbenchmarks.com/ bcalli@wpi.edu Yale University and Berkeley Yearly Creative Commons Attribution 4.0 International (CC BY 4.0) aws-pds, robotics ['[Browse Bucket](https://ycb-benchmarks.s3.amazonaws.com/index.html)'] -YouTube 8 Million - Data Lakehouse Ready Original YT8M *tfrecords File structure info can be found here arn:aws:s3:::aws-roda-ml-datalake/yt8m/ us-west-2 S3 Bucket https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_install. https://github.com/aws-samples/data-lake-as-code/issues [Amazon Web Services](https://aws.amazon.com/) Google Research has not updated the dataset since 2019. https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_attribut amazon.science, computer vision, machine learning, labeled, parquet, video YouTube 8 Million - Data Lakehouse Ready Lakehouse ready YT8M as Glue Parquet files Install instructions here arn:aws:s3:::aws-roda-ml-datalake/yt8m_ods/ us-west-2 S3 Bucket https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_install. https://github.com/aws-samples/data-lake-as-code/issues [Amazon Web Services](https://aws.amazon.com/) Google Research has not updated the dataset since 2019. https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_attribut amazon.science, computer vision, machine learning, labeled, parquet, video YouTube 8 Million - Data Lakehouse Ready Replica of the two locations above in us-east-1 arn:aws:s3:::aws-roda-ml-datalake-us-east-1/ us-east-1 S3 Bucket https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_install. https://github.com/aws-samples/data-lake-as-code/issues [Amazon Web Services](https://aws.amazon.com/) Google Research has not updated the dataset since 2019. https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_attribut amazon.science, computer vision, machine learning, labeled, parquet, video +YouTube 8 Million - Data Lakehouse Ready Original YT8M *tfrecords File structure info can be found here arn:aws:s3:::aws-roda-ml-datalake/yt8m/ us-west-2 S3 Bucket https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_install. https://github.com/aws-samples/data-lake-as-code/issues [Amazon Web Services](https://aws.amazon.com/) Google Research has not updated the dataset since 2019. https://github.com/aws-samples/data-lake-as-code/blob/roda-ml/docs/roda_attribut amazon.science, computer vision, machine learning, labeled, parquet, video ZEST: ZEroShot learning from Task descriptions Project data files in a public bucket arn:aws:s3:::ai2-public-datasets/zest/ us-west-2 S3 Bucket https://allenai.org/data/zest info@allenai.org [Allen Institute for AI](https://allenai.org) Not updated [CC BY](https://creativecommons.org/licenses/by/4.0) aws-pds, machine learning, natural language processing ZINC Database 3D molecular docking structure files in db2gz, sdf and mol2 formats arn:aws:s3:::zinc3d us-east-1 S3 Bucket http://wiki.docking.org/index.php/ZINC15:Resources [John Irwin](chemistry4biology@gmail.com) [John Irwin](chemistry4biology@gmail.com) Monthly ZINC is free as in beer. You may not redistribute without the written permission aws-pds, life sciences, biology, chemical biology, pharmaceutical, molecular docking, protein iHART Whole Genome Sequencing Data Set gVCF and VCF files from The iHART whole genome sequencing study, control data se arn:aws:s3:::ihart-brain us-east-1 S3 Bucket http://www.ihart.org/data ihart2-org@stanford.edu [Stanford University](https://wall-lab.stanford.edu/projects/ihart/) The dataset may be updated with additional or corrected data on a need-to-update Data use is subject to the access and publication polices of the iHART. More inf aws-pds, autism spectrum disorder, genetic, genomic, life sciences, whole genome sequencing, bam, vcf http://www.ihart.org/access +iHART Whole Genome Sequencing Data Set gVCF and VCF files from The iHART whole genome sequencing study, control data se arn:aws:s3:::ihart-psp us-east-1 S3 Bucket http://www.ihart.org/data ihart2-org@stanford.edu [Stanford University](https://wall-lab.stanford.edu/projects/ihart/) The dataset may be updated with additional or corrected data on a need-to-update Data use is subject to the access and publication polices of the iHART. More inf aws-pds, autism spectrum disorder, genetic, genomic, life sciences, whole genome sequencing, bam, vcf http://www.ihart.org/access iHART Whole Genome Sequencing Data Set Cram, gVCF, and VCF files from The iHART whole genome sequencing study, Phase I+ arn:aws:s3:::ihart-hg38 us-east-1 S3 Bucket http://www.ihart.org/data ihart2-org@stanford.edu [Stanford University](https://wall-lab.stanford.edu/projects/ihart/) The dataset may be updated with additional or corrected data on a need-to-update Data use is subject to the access and publication polices of the iHART. More inf aws-pds, autism spectrum disorder, genetic, genomic, life sciences, whole genome sequencing, bam, vcf http://www.ihart.org/access iHART Whole Genome Sequencing Data Set BAM, gVCF, and VCF files from The iHART whole genome sequencing study, Phase II arn:aws:s3:::ihart-main us-east-1 S3 Bucket http://www.ihart.org/data ihart2-org@stanford.edu [Stanford University](https://wall-lab.stanford.edu/projects/ihart/) The dataset may be updated with additional or corrected data on a need-to-update Data use is subject to the access and publication polices of the iHART. More inf aws-pds, autism spectrum disorder, genetic, genomic, life sciences, whole genome sequencing, bam, vcf http://www.ihart.org/access iHART Whole Genome Sequencing Data Set BAM, gVCF, and VCF files from The iHART whole genome sequencing study, Phase I arn:aws:s3:::ihart-release us-east-1 S3 Bucket http://www.ihart.org/data ihart2-org@stanford.edu [Stanford University](https://wall-lab.stanford.edu/projects/ihart/) The dataset may be updated with additional or corrected data on a need-to-update Data use is subject to the access and publication polices of the iHART. More inf aws-pds, autism spectrum disorder, genetic, genomic, life sciences, whole genome sequencing, bam, vcf http://www.ihart.org/access -iHART Whole Genome Sequencing Data Set gVCF and VCF files from The iHART whole genome sequencing study, control data se arn:aws:s3:::ihart-psp us-east-1 S3 Bucket http://www.ihart.org/data ihart2-org@stanford.edu [Stanford University](https://wall-lab.stanford.edu/projects/ihart/) The dataset may be updated with additional or corrected data on a need-to-update Data use is subject to the access and publication polices of the iHART. More inf aws-pds, autism spectrum disorder, genetic, genomic, life sciences, whole genome sequencing, bam, vcf http://www.ihart.org/access iNaturalist Licensed Observation Images Image files (eg JPEG) associated with metadata describing the observation asso arn:aws:s3:::inaturalist-open-data us-east-1 S3 Bucket "Documentation can be found