Skip to content

Commit 5fddd8e

Browse files
committed
Updated datasets 2025-07-19 UTC
1 parent 99b361a commit 5fddd8e

8 files changed

Lines changed: 6394 additions & 42678 deletions

aws_geo_datasets.json

Lines changed: 115 additions & 29 deletions
Original file line numberDiff line numberDiff line change
@@ -1724,6 +1724,32 @@
17241724
"AccountRequired": null,
17251725
"Host": null
17261726
},
1727+
{
1728+
"Name": "CarbonPDF",
1729+
"Description": "A component-level product carbon footprint dataset and a corresponding question-answering dataset based on it",
1730+
"ARN": "arn:aws:s3:::carbonpdf",
1731+
"Region": "us-east-1",
1732+
"Type": "S3 Bucket",
1733+
"Documentation": "https://github.com/pittcps/carbonpdf-dataset",
1734+
"Contact": "kaz81@pitt.edu",
1735+
"ManagedBy": "Pittcps lab",
1736+
"UpdateFrequency": "Data for a new company is added once collected.",
1737+
"License": "CC BY 4.0 (https://creativecommons.org/licenses/by/4.0/)",
1738+
"Tags": [
1739+
"aws-pds",
1740+
"environmental",
1741+
"product comparison",
1742+
"csv",
1743+
"information retrieval",
1744+
"industry"
1745+
],
1746+
"Explore": [
1747+
"[Explore](https://github.com/pittcps/carbonpdf-dataset)"
1748+
],
1749+
"RequesterPays": null,
1750+
"AccountRequired": null,
1751+
"Host": null
1752+
},
17271753
{
17281754
"Name": "Central Weather Administration OpenData",
17291755
"Description": "CWA data lake",
@@ -6483,9 +6509,9 @@
64836509
{
64846510
"Name": "Global Biodiversity Information Facility (GBIF) Species Occurrences - GBIF species occurrence data in Parquet format (af-south-1 region)",
64856511
"Description": "GBIF species occurrence data in Parquet format (af-south-1 region)",
6486-
"ARN": "arn:aws:sns:af-south-1:288719126026:gbif-open-data-af-south-1-object_created",
6512+
"ARN": "arn:aws:s3:::gbif-open-data-af-south-1",
64876513
"Region": "af-south-1",
6488-
"Type": "SNS Topic",
6514+
"Type": "S3 Bucket",
64896515
"Documentation": "Documentation can be found [here](https://github.com/gbif/occurrence/blob/master/aws-public-data.md). You can learn more about GBIF [here](https://www.gbif.org).",
64906516
"Contact": "helpdesk@gbif.org",
64916517
"ManagedBy": "The Global Biodiversity Information Facility ([GBIF](https://www.gbif.org))",
@@ -6499,17 +6525,19 @@
64996525
"conservation",
65006526
"life sciences"
65016527
],
6502-
"Explore": null,
6528+
"Explore": [
6529+
"[Browse bucket](https://gbif-open-data-af-south-1.s3.af-south-1.amazonaws.com/index.html)"
6530+
],
65036531
"RequesterPays": null,
65046532
"AccountRequired": null,
65056533
"Host": null
65066534
},
65076535
{
65086536
"Name": "Global Biodiversity Information Facility (GBIF) Species Occurrences - GBIF species occurrence data in Parquet format (af-south-1 region)",
65096537
"Description": "GBIF species occurrence data in Parquet format (af-south-1 region)",
6510-
"ARN": "arn:aws:s3:::gbif-open-data-af-south-1",
6538+
"ARN": "arn:aws:sns:af-south-1:288719126026:gbif-open-data-af-south-1-object_created",
65116539
"Region": "af-south-1",
6512-
"Type": "S3 Bucket",
6540+
"Type": "SNS Topic",
65136541
"Documentation": "Documentation can be found [here](https://github.com/gbif/occurrence/blob/master/aws-public-data.md). You can learn more about GBIF [here](https://www.gbif.org).",
65146542
"Contact": "helpdesk@gbif.org",
65156543
"ManagedBy": "The Global Biodiversity Information Facility ([GBIF](https://www.gbif.org))",
@@ -6523,9 +6551,7 @@
65236551
"conservation",
65246552
"life sciences"
65256553
],
6526-
"Explore": [
6527-
"[Browse bucket](https://gbif-open-data-af-south-1.s3.af-south-1.amazonaws.com/index.html)"
6528-
],
6554+
"Explore": null,
65296555
"RequesterPays": null,
65306556
"AccountRequired": null,
65316557
"Host": null
@@ -6583,9 +6609,9 @@
65836609
{
65846610
"Name": "Global Biodiversity Information Facility (GBIF) Species Occurrences - GBIF species occurrence data in Parquet format (eu-central-1 region)",
65856611
"Description": "GBIF species occurrence data in Parquet format (eu-central-1 region)",
6586-
"ARN": "arn:aws:s3:::gbif-open-data-eu-central-1",
6612+
"ARN": "arn:aws:sns:af-south-1:288719126026:gbif-open-data-eu-central-1-object_created",
65876613
"Region": "eu-central-1",
6588-
"Type": "S3 Bucket",
6614+
"Type": "SNS Topic",
65896615
"Documentation": "Documentation can be found [here](https://github.com/gbif/occurrence/blob/master/aws-public-data.md). You can learn more about GBIF [here](https://www.gbif.org).",
65906616
"Contact": "helpdesk@gbif.org",
65916617
"ManagedBy": "The Global Biodiversity Information Facility ([GBIF](https://www.gbif.org))",
@@ -6599,19 +6625,17 @@
65996625
"conservation",
66006626
"life sciences"
66016627
],
6602-
"Explore": [
6603-
"[Browse bucket](https://gbif-open-data-eu-central-1.s3.eu-central-1.amazonaws.com/index.html)"
6604-
],
6628+
"Explore": null,
66056629
"RequesterPays": null,
66066630
"AccountRequired": null,
66076631
"Host": null
66086632
},
66096633
{
66106634
"Name": "Global Biodiversity Information Facility (GBIF) Species Occurrences - GBIF species occurrence data in Parquet format (eu-central-1 region)",
66116635
"Description": "GBIF species occurrence data in Parquet format (eu-central-1 region)",
6612-
"ARN": "arn:aws:sns:af-south-1:288719126026:gbif-open-data-eu-central-1-object_created",
6636+
"ARN": "arn:aws:s3:::gbif-open-data-eu-central-1",
66136637
"Region": "eu-central-1",
6614-
"Type": "SNS Topic",
6638+
"Type": "S3 Bucket",
66156639
"Documentation": "Documentation can be found [here](https://github.com/gbif/occurrence/blob/master/aws-public-data.md). You can learn more about GBIF [here](https://www.gbif.org).",
66166640
"Contact": "helpdesk@gbif.org",
66176641
"ManagedBy": "The Global Biodiversity Information Facility ([GBIF](https://www.gbif.org))",
@@ -6625,17 +6649,19 @@
66256649
"conservation",
66266650
"life sciences"
66276651
],
6628-
"Explore": null,
6652+
"Explore": [
6653+
"[Browse bucket](https://gbif-open-data-eu-central-1.s3.eu-central-1.amazonaws.com/index.html)"
6654+
],
66296655
"RequesterPays": null,
66306656
"AccountRequired": null,
66316657
"Host": null
66326658
},
66336659
{
66346660
"Name": "Global Biodiversity Information Facility (GBIF) Species Occurrences - GBIF species occurrence data in Parquet format (sa-east-1 region)",
66356661
"Description": "GBIF species occurrence data in Parquet format (sa-east-1 region)",
6636-
"ARN": "arn:aws:sns:af-south-1:288719126026:gbif-open-data-sa-east-1-object_created",
6662+
"ARN": "arn:aws:s3:::gbif-open-data-sa-east-1",
66376663
"Region": "sa-east-1",
6638-
"Type": "SNS Topic",
6664+
"Type": "S3 Bucket",
66396665
"Documentation": "Documentation can be found [here](https://github.com/gbif/occurrence/blob/master/aws-public-data.md). You can learn more about GBIF [here](https://www.gbif.org).",
66406666
"Contact": "helpdesk@gbif.org",
66416667
"ManagedBy": "The Global Biodiversity Information Facility ([GBIF](https://www.gbif.org))",
@@ -6649,17 +6675,19 @@
66496675
"conservation",
66506676
"life sciences"
66516677
],
6652-
"Explore": null,
6678+
"Explore": [
6679+
"[Browse bucket](https://gbif-open-data-sa-east-1.s3.sa-east-1.amazonaws.com/index.html)"
6680+
],
66536681
"RequesterPays": null,
66546682
"AccountRequired": null,
66556683
"Host": null
66566684
},
66576685
{
66586686
"Name": "Global Biodiversity Information Facility (GBIF) Species Occurrences - GBIF species occurrence data in Parquet format (sa-east-1 region)",
66596687
"Description": "GBIF species occurrence data in Parquet format (sa-east-1 region)",
6660-
"ARN": "arn:aws:s3:::gbif-open-data-sa-east-1",
6688+
"ARN": "arn:aws:sns:af-south-1:288719126026:gbif-open-data-sa-east-1-object_created",
66616689
"Region": "sa-east-1",
6662-
"Type": "S3 Bucket",
6690+
"Type": "SNS Topic",
66636691
"Documentation": "Documentation can be found [here](https://github.com/gbif/occurrence/blob/master/aws-public-data.md). You can learn more about GBIF [here](https://www.gbif.org).",
66646692
"Contact": "helpdesk@gbif.org",
66656693
"ManagedBy": "The Global Biodiversity Information Facility ([GBIF](https://www.gbif.org))",
@@ -6673,9 +6701,7 @@
66736701
"conservation",
66746702
"life sciences"
66756703
],
6676-
"Explore": [
6677-
"[Browse bucket](https://gbif-open-data-sa-east-1.s3.sa-east-1.amazonaws.com/index.html)"
6678-
],
6704+
"Explore": null,
66796705
"RequesterPays": null,
66806706
"AccountRequired": null,
66816707
"Host": null
@@ -13076,7 +13102,7 @@
1307613102
{
1307713103
"Name": "NOAA Joint Polar Satellite System (JPSS) - New data notifications for JPSS data, only Lambda and SQS protocols allowed",
1307813104
"Description": "New data notifications for JPSS data, only Lambda and SQS protocols allowed",
13079-
"ARN": "arn:aws:sns:us-east-1:709902155096:NewSNPPObject",
13105+
"ARN": "arn:aws:sns:us-east-1:709902155096:NewNOAA20Object",
1308013106
"Region": "us-east-1",
1308113107
"Type": "SNS Topic",
1308213108
"Documentation": "https://github.com/NOAA-Big-Data-Program/bdp-data-docs/tree/main/JPSS",
@@ -13122,7 +13148,7 @@
1312213148
{
1312313149
"Name": "NOAA Joint Polar Satellite System (JPSS) - New data notifications for JPSS data, only Lambda and SQS protocols allowed",
1312413150
"Description": "New data notifications for JPSS data, only Lambda and SQS protocols allowed",
13125-
"ARN": "arn:aws:sns:us-east-1:709902155096:NewJPSSObject",
13151+
"ARN": "arn:aws:sns:us-east-1:709902155096:NewSNPPObject",
1312613152
"Region": "us-east-1",
1312713153
"Type": "SNS Topic",
1312813154
"Documentation": "https://github.com/NOAA-Big-Data-Program/bdp-data-docs/tree/main/JPSS",
@@ -13145,7 +13171,7 @@
1314513171
{
1314613172
"Name": "NOAA Joint Polar Satellite System (JPSS) - New data notifications for JPSS data, only Lambda and SQS protocols allowed",
1314713173
"Description": "New data notifications for JPSS data, only Lambda and SQS protocols allowed",
13148-
"ARN": "arn:aws:sns:us-east-1:709902155096:NewNOAA20Object",
13174+
"ARN": "arn:aws:sns:us-east-1:709902155096:NewJPSSObject",
1314913175
"Region": "us-east-1",
1315013176
"Type": "SNS Topic",
1315113177
"Documentation": "https://github.com/NOAA-Big-Data-Program/bdp-data-docs/tree/main/JPSS",
@@ -14573,7 +14599,7 @@
1457314599
{
1457414600
"Name": "NOAA U.S. Climate Gridded Dataset (NClimGrid) - New data notifications for Daily NClimGrid, only Lambda and SQS protocols allowed",
1457514601
"Description": "New data notifications for Daily NClimGrid, only Lambda and SQS protocols allowed",
14576-
"ARN": "arn:aws:sns:us-east-1:123901341784:NewNClimGridMonthlyObject",
14602+
"ARN": "arn:aws:sns:us-east-1:123901341784:NewNClimGridDailyObject",
1457714603
"Region": "us-east-1",
1457814604
"Type": "SNS Topic",
1457914605
"Documentation": "https://www.ncei.noaa.gov/access/metadata/landing-page/bin/iso?id=gov.noaa.ncdc:C00332",
@@ -14596,7 +14622,7 @@
1459614622
{
1459714623
"Name": "NOAA U.S. Climate Gridded Dataset (NClimGrid) - New data notifications for Daily NClimGrid, only Lambda and SQS protocols allowed",
1459814624
"Description": "New data notifications for Daily NClimGrid, only Lambda and SQS protocols allowed",
14599-
"ARN": "arn:aws:sns:us-east-1:123901341784:NewNClimGridDailyObject",
14625+
"ARN": "arn:aws:sns:us-east-1:123901341784:NewNClimGridMonthlyObject",
1460014626
"Region": "us-east-1",
1460114627
"Type": "SNS Topic",
1460214628
"Documentation": "https://www.ncei.noaa.gov/access/metadata/landing-page/bin/iso?id=gov.noaa.ncdc:C00332",
@@ -16451,6 +16477,30 @@
1645116477
"AccountRequired": null,
1645216478
"Host": null
1645316479
},
16480+
{
16481+
"Name": "NREL Wind Integration National Dataset - Super-Resolution for Renewable Energy Resource Data with Wind from Reanalysis (Sup3rWind)",
16482+
"Description": "Super-Resolution for Renewable Energy Resource Data with Wind from Reanalysis (Sup3rWind)",
16483+
"ARN": "arn:aws:s3:::nrel-pds-wtk/sup3rwind/",
16484+
"Region": "us-west-2",
16485+
"Type": "S3 Bucket",
16486+
"Documentation": "https://www.nrel.gov/grid/wind-toolkit.html",
16487+
"Contact": "wind-toolkit@nrel.gov",
16488+
"ManagedBy": "[National Renewable Energy Laboratory](https://www.nrel.gov/)",
16489+
"UpdateFrequency": "As Needed",
16490+
"License": "Creative Commons Attribution 3.0 United States License",
16491+
"Tags": [
16492+
"aws-pds",
16493+
"environmental",
16494+
"geospatial",
16495+
"meteorological"
16496+
],
16497+
"Explore": [
16498+
"[Browse Dataset](https://data.openei.org/s3_viewer?bucket=nrel-pds-wtk&prefix=sup3rwind%2F)"
16499+
],
16500+
"RequesterPays": null,
16501+
"AccountRequired": null,
16502+
"Host": null
16503+
},
1645416504
{
1645516505
"Name": "NREL Wind Integration National Dataset - Techno-economic subset of the WIND Toolkit by location in netCDF",
1645616506
"Description": "Techno-economic subset of the WIND Toolkit by location in netCDF",
@@ -19274,6 +19324,42 @@
1927419324
"AccountRequired": null,
1927519325
"Host": null
1927619326
},
19327+
{
19328+
"Name": "Sanborn Maps Data Package",
19329+
"Description": "Sanborn Maps data",
19330+
"ARN": "arn:aws:s3:::loc-sanborn-maps",
19331+
"Region": "us-west-2",
19332+
"Type": "S3 Bucket",
19333+
"Documentation": "https://data.labs.loc.gov/sanborn/",
19334+
"Contact": "For curatorial questions about the content of the collection and formats, contact the Library of Congress Geography and Map Division at https://ask.loc.gov/map-geography. For technical questions about access, contact LC-Labs@loc.gov",
19335+
"ManagedBy": "[Library of Congress](https://www.loc.gov/)",
19336+
"UpdateFrequency": "As new and significant changes to the underlying digital collection occurs",
19337+
"License": "The content of the Library of Congress online Sanborn Maps Collection is in the public domain and is free to use and reuse. For more information, see https://www.loc.gov/collections/sanborn-maps/about-this-collection/rights-and-access/.",
19338+
"Tags": [
19339+
"aws-pds",
19340+
"archives",
19341+
"cities",
19342+
"computer vision",
19343+
"conservation",
19344+
"culture",
19345+
"cultural preservation",
19346+
"demographics",
19347+
"digital assets",
19348+
"geospatial",
19349+
"history",
19350+
"housing",
19351+
"land use",
19352+
"mapping",
19353+
"urban"
19354+
],
19355+
"Explore": [
19356+
"[Browse Bucket by State](https://loc-sanborn-maps.s3.amazonaws.com/maps-by-state/index.html)",
19357+
"[README](https://loc-sanborn-maps.s3.amazonaws.com/README.html)"
19358+
],
19359+
"RequesterPays": null,
19360+
"AccountRequired": null,
19361+
"Host": null
19362+
},
1927719363
{
1927819364
"Name": "SatPM2.5",
1927919365
"Description": "Satellite-Derived Fine Particulate Matter (PM25) concentrations from the Atmospheric Composition Analysis Group and Washington University in St Louis, version GL060204",

0 commit comments

Comments
 (0)