diff --git a/README.md b/README.md index 0fd946392..8d6bb487a 100644 --- a/README.md +++ b/README.md @@ -31,10 +31,21 @@ Resources: Region: Type: DataAtWork: - - Title: - URL: - AuthorName: - AuthorURL: + Tutorials: + - Title: + URL: + AuthorName: + AuthorURL: + Tools & Applications: + - Title: + URL: + AuthorName: + AuthorURL: + Publications: + - Title: + URL: + AuthorName: + AuthorURL: ``` The metadata required for each dataset entry is as follows: @@ -93,22 +104,23 @@ Resources: Region: us-east-1 Type: SNS Topic DataAtWork: - - Title: Exploring GDELT with Athena - URL: http://blog.julien.org/2017/03/exploring-gdelt-data-set-with-amazon.html - AuthorName: Julien Simon - AuthorURL: https://twitter.com/julsimon - - Title: Running R on Amazon Athena - URL: https://aws.amazon.com/blogs/big-data/running-r-on-amazon-athena/ - AuthorName: Gopal Wunnava - AuthorURL: https://www.linkedin.com/in/gopal-wunnava-b11a77/ - - Title: Bootstrapping GeoMesa HBase on AWS S3 - URL: http://www.geomesa.org/documentation/tutorials/geomesa-hbase-s3-on-aws.html - AuthorName: Commonwealth Computer Research, Inc. - AuthorURL: https://www.ccri.com - - Title: Creating PySpark DataFrame from CSV in AWS S3 in EMR - URL: https://gist.github.com/jakechen/6955f2de51212163312b6430555b8e0b - AuthorName: Jake Chen - AuthorURL: https://github.com/jakechen + Tutorials: + - Title: Exploring GDELT with Athena + URL: http://blog.julien.org/2017/03/exploring-gdelt-data-set-with-amazon.html + AuthorName: Julien Simon + AuthorURL: https://twitter.com/julsimon + - Title: Running R on Amazon Athena + URL: https://aws.amazon.com/blogs/big-data/running-r-on-amazon-athena/ + AuthorName: Gopal Wunnava + AuthorURL: https://www.linkedin.com/in/gopal-wunnava-b11a77/ + - Title: Bootstrapping GeoMesa HBase on AWS S3 + URL: http://www.geomesa.org/documentation/tutorials/geomesa-hbase-s3-on-aws.html + AuthorName: Commonwealth Computer Research, Inc. 
+ AuthorURL: https://www.ccri.com + - Title: Creating PySpark DataFrame from CSV in AWS S3 in EMR + URL: https://gist.github.com/jakechen/6955f2de51212163312b6430555b8e0b + AuthorName: Jake Chen + AuthorURL: https://github.com/jakechen ``` ## How can I contribute? diff --git a/datasets/1000-genomes.yaml b/datasets/1000-genomes.yaml index 54308466f..19d5b9c73 100644 --- a/datasets/1000-genomes.yaml +++ b/datasets/1000-genomes.yaml @@ -15,7 +15,10 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Exploratory data analysis of genomic datasets using ADAM and Mango with Apache Spark on Amazon EMR - URL: https://aws.amazon.com/blogs/big-data/exploratory-data-analysis-of-genomic-datasets-using-adam-and-mango-with-apache-spark-on-amazon-emr/ - AuthorName: Alyssa Marrow - AuthorURL: https://research.eecs.berkeley.edu/~akmorrow/ + Tutorials: + Tools & Applications: + Publications: + - Title: Exploratory data analysis of genomic datasets using ADAM and Mango with Apache Spark on Amazon EMR + URL: https://aws.amazon.com/blogs/big-data/exploratory-data-analysis-of-genomic-datasets-using-adam-and-mango-with-apache-spark-on-amazon-emr/ + AuthorName: Alyssa Marrow + AuthorURL: https://research.eecs.berkeley.edu/~akmorrow/ diff --git a/datasets/3kricegenome.yaml b/datasets/3kricegenome.yaml index 99941f647..ed6c7aad4 100644 --- a/datasets/3kricegenome.yaml +++ b/datasets/3kricegenome.yaml @@ -16,3 +16,7 @@ Resources: ARN: arn:aws:s3:::3kricegenome Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/990-spreadsheets.yaml b/datasets/990-spreadsheets.yaml index 27c72272b..596a4e0b5 100644 --- a/datasets/990-spreadsheets.yaml +++ b/datasets/990-spreadsheets.yaml @@ -16,3 +16,7 @@ Resources: ARN: arn:aws:s3:::irs-990-spreadsheets Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/afsis.yaml b/datasets/afsis.yaml index 
471a7cab7..a2bac33a5 100644 --- a/datasets/afsis.yaml +++ b/datasets/afsis.yaml @@ -1,6 +1,6 @@ Name: Africa Soil Information Service (AfSIS) Soil Chemistry Description: | - This dataset contains soil infrared spectral data and paired soil property + This dataset contains soil infrared spectral data and paired soil property reference measurements for georeferenced soil samples that were collected through the Africa Soil Information Service (AfSIS) project, which lasted from 2009 through 2018. In this release, we include data collected during @@ -34,11 +34,14 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: AfSIS Soil Chemistry - Usage Tutorial - URL: https://github.com/qedsoftware/afsis-soil-chem-tutorial/ - AuthorName: QED - AuthorURL: https://qed.ai - - Title: Goalkeepers 2018, Soil - The Big Data Beneath Your Feet - URL: https://www.youtube.com/watch?v=Fb9R0CnPMkc - AuthorName: QED - AuthorURL: https://qed.ai + Tutorials: + - Title: AfSIS Soil Chemistry - Usage Tutorial + URL: https://github.com/qedsoftware/afsis-soil-chem-tutorial/ + AuthorName: QED + AuthorURL: https://qed.ai + Tools & Applications: + Publications: + - Title: Goalkeepers 2018, Soil - The Big Data Beneath Your Feet + URL: https://www.youtube.com/watch?v=Fb9R0CnPMkc + AuthorName: QED + AuthorURL: https://qed.ai diff --git a/datasets/allen-brain-observatory.yaml b/datasets/allen-brain-observatory.yaml index 1a8c76681..0b899766f 100644 --- a/datasets/allen-brain-observatory.yaml +++ b/datasets/allen-brain-observatory.yaml @@ -23,7 +23,10 @@ Resources: Region: us-west-2 Type: S3 Bucket DataAtWork: - - Title: Use the Allen Brain Observatory – Visual Coding on AWS - URL: https://github.com/AllenInstitute/AllenSDK/wiki/Use-the-Allen-Brain-Observatory-%E2%80%93-Visual-Coding-on-AWS - AuthorName: Nika Keller, David Feng - AuthorURL: https://twitter.com/dyfbrain \ No newline at end of file + Tutorials: + - Title: Use the Allen Brain Observatory – Visual Coding on AWS + URL: 
https://github.com/AllenInstitute/AllenSDK/wiki/Use-the-Allen-Brain-Observatory-%E2%80%93-Visual-Coding-on-AWS + AuthorName: Nika Keller, David Feng + AuthorURL: https://twitter.com/dyfbrain + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/amazon-bin-imagery.yaml b/datasets/amazon-bin-imagery.yaml index aca306f38..c10aae243 100644 --- a/datasets/amazon-bin-imagery.yaml +++ b/datasets/amazon-bin-imagery.yaml @@ -15,11 +15,14 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Amazon Bin Image Dataset Challenge - URL: https://github.com/silverbottlep/abid_challenge - AuthorName: silverbottlep - AuthorURL: https://github.com/silverbottlep - - Title: Amazon Inventory Reconciliation using AI - URL: https://github.com/OneNow/AI-Inventory-Reconciliation - AuthorName: Pablo Rodriguez Bertorello, Sravan Sripada, Nutchapol Dendumrongsup - AuthorURL: https://github.com/pablo-tech + Tutorials: + Tools & Applications: + Publications: + - Title: Amazon Bin Image Dataset Challenge + URL: https://github.com/silverbottlep/abid_challenge + AuthorName: silverbottlep + AuthorURL: https://github.com/silverbottlep + - Title: Amazon Inventory Reconciliation using AI + URL: https://github.com/OneNow/AI-Inventory-Reconciliation + AuthorName: Pablo Rodriguez Bertorello, Sravan Sripada, Nutchapol Dendumrongsup + AuthorURL: https://github.com/pablo-tech diff --git a/datasets/amazon-reviews.yaml b/datasets/amazon-reviews.yaml index 78bab8764..d067df453 100644 --- a/datasets/amazon-reviews.yaml +++ b/datasets/amazon-reviews.yaml @@ -16,15 +16,18 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: How to scale sentiment analysis using Amazon Comprehend, AWS Glue and Amazon Athena - URL: https://aws.amazon.com/blogs/machine-learning/how-to-scale-sentiment-analysis-using-amazon-comprehend-aws-glue-and-amazon-athena/ - AuthorName: Roy Hasson - AuthorURL: https://twitter.com/royhasson - - Title: Implementing a recommender 
system with Amazon SageMaker and Apache MXNet Gluon - URL: https://github.com/awslabs/amazon-sagemaker-examples/blob/master/introduction_to_applying_machine_learning/gluon_recommender_system/gluon_recommender_system.ipynb - AuthorName: David Arpin - AuthorURL: https://github.com/djarpin - - Title: Querying Review Data with Kognitio AWS Marketplace product using SQL - URL: https://www.linkedin.com/pulse/100-shades-grey-other-amazon-review-discoveries-mark-chopping/ - AuthorName: Mark Chopping - AuthorURL: https://twitter.com/markchopping1 + Tutorials: + - Title: How to scale sentiment analysis using Amazon Comprehend, AWS Glue and Amazon Athena + URL: https://aws.amazon.com/blogs/machine-learning/how-to-scale-sentiment-analysis-using-amazon-comprehend-aws-glue-and-amazon-athena/ + AuthorName: Roy Hasson + AuthorURL: https://twitter.com/royhasson + - Title: Implementing a recommender system with Amazon SageMaker and Apache MXNet Gluon + URL: https://github.com/awslabs/amazon-sagemaker-examples/blob/master/introduction_to_applying_machine_learning/gluon_recommender_system/gluon_recommender_system.ipynb + AuthorName: David Arpin + AuthorURL: https://github.com/djarpin + - Title: Querying Review Data with Kognitio AWS Marketplace product using SQL + URL: https://www.linkedin.com/pulse/100-shades-grey-other-amazon-review-discoveries-mark-chopping/ + AuthorName: Mark Chopping + AuthorURL: https://twitter.com/markchopping1 + Tools & Applications: + Publications: diff --git a/datasets/america-ninja-warrior.yaml b/datasets/america-ninja-warrior.yaml deleted file mode 100644 index d7224c76d..000000000 --- a/datasets/america-ninja-warrior.yaml +++ /dev/null @@ -1,22 +0,0 @@ -Name: American Ninja Warrior Obstacle History -Description: | - Obstacle history of American Ninja Warrior seasons 1-9 - This dataset includes every obstacle in the history of American Ninja Warrior from season 1 to 9. 
This includes the obstacles at Sasuke (also known as the original Ninja Warrior in Japan) during seasons 1-3 when American Ninja Warrior (ANW) was on G4, and the top 10 competitors from the semi-finals round of ANW were sent to Sasuke to compete. Starting in season 4 of ANW, which is known as the "NBC era" when the show took on the regional/city formats for both qualifying and semi-final rounds with the finalists from each region competing at the National Finals of ANW in Las Vegas. -Contact: https://data.world/ninja/anw-obstacle-history/discuss -Documentation: https://data.world/ninja/anw-obstacle-history -UpdateFrequency: Annually -Tags: - - multimedia - - events - - sports -License: CC-BY -Resources: - - Description: Project data files - ARN: arn:aws:s3:::dataworld-odaws-us-east-1/datasets/ninja/anw-obstacle-history/ - Region: us-east-1 - Type: S3 Bucket -DataAtWork: - - Title: Ninja Warrior obstacle data - URL: https://data.world/ninja/anw-obstacle-history - AuthorName: "@ninja on data.world" - AuthorURL: https://data.world/ninja \ No newline at end of file diff --git a/datasets/aws-igenomes.yaml b/datasets/aws-igenomes.yaml index dd1a30faa..46a9bbb53 100644 --- a/datasets/aws-igenomes.yaml +++ b/datasets/aws-igenomes.yaml @@ -16,7 +16,10 @@ Resources: Region: eu-west-1 Type: S3 Bucket DataAtWork: - - Title: nf-core analysis pipelines - URL: http://nf-co.re/ - AuthorName: Phil Ewels - AuthorURL: http://phil.ewels.co.uk/ + Tutorials: + Tools & Applications: + - Title: nf-core analysis pipelines + URL: http://nf-co.re/ + AuthorName: Phil Ewels + AuthorURL: http://phil.ewels.co.uk/ + Publications: diff --git a/datasets/broad-references.yaml b/datasets/broad-references.yaml index 8dcce4d1d..2bafb53d6 100644 --- a/datasets/broad-references.yaml +++ b/datasets/broad-references.yaml @@ -18,7 +18,10 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Genomics Workflows on AWS - Cromwell on AWS - URL: 
https://docs.opendata.aws/genomics-workflows/orchestration/cromwell/cromwell-examples/#real-world-example-haplotypecaller - AuthorName: W. Lee Pang - AuthorURL: https://www.linkedin.com/in/lee-pang-a039a26/ + Tutorials: + Tools & Applications: + - Title: Genomics Workflows on AWS - Cromwell on AWS + URL: https://docs.opendata.aws/genomics-workflows/orchestration/cromwell/cromwell-examples/#real-world-example-haplotypecaller + AuthorName: W. Lee Pang + AuthorURL: https://www.linkedin.com/in/lee-pang-a039a26/ + Publications: diff --git a/datasets/cbers.yaml b/datasets/cbers.yaml index af10c05c6..35001bec1 100644 --- a/datasets/cbers.yaml +++ b/datasets/cbers.yaml @@ -53,38 +53,41 @@ Resources: Region: us-east-1 Type: SNS Topic DataAtWork: - - Title: STAC V0.7 search endpoint for archive - URL: https://stac.amskepler.com/v07/stac/search - AuthorName: AMS Kepler - AuthorURL: https://github.com/fredliporace/cbers-2-stac - - Title: Remote Pixel Viewer - URL: https://viewer.remotepixel.ca - AuthorName: Remote Pixel - AuthorURL: http://remotepixel.ca/ - - Title: EOS Land Viewer - URL: https://eos.com/landviewer/ - AuthorName: Earth Observing System - AuthorURL: https://eos.com/ - - Title: CBERS timelapse GIF generator - URL: https://github.com/fredliporace/cbersgif - AuthorName: Frederico Liporace - AuthorURL: https://github.com/fredliporace - - Title: aws-sat-api-py - URL: https://github.com/RemotePixel/aws-sat-api-py - AuthorName: Remote Pixel - AuthorURL: http://remotepixel.ca/ - - Title: rio-tiler - URL: https://github.com/mapbox/rio-tiler - AuthorName: Mapbox - AuthorURL: https://www.mapbox.com/ - - Title: cbers-tiler - URL: https://github.com/mapbox/cbers-tiler - AuthorName: Mapbox - AuthorURL: https://www.mapbox.com/ - - Title: CBERS static STAC catalog served by stac-browser - URL: https://cbers.stac.cloud - AuthorName: Radiant Earth - AuthorURL: https://github.com/radiantearth/stac-browser - - Title: Keeping a SpatioTemporal Asset Catalog (STAC) Up To Date with 
SNS/SQS - URL: https://aws.amazon.com/blogs/publicsector/keeping-a-spatiotemporal-asset-catalog-stac-up-to-date-with-sns-sqs/ - AuthorName: Frederico Liporace + Tutorials: + - Title: Keeping a SpatioTemporal Asset Catalog (STAC) Up To Date with SNS/SQS + URL: https://aws.amazon.com/blogs/publicsector/keeping-a-spatiotemporal-asset-catalog-stac-up-to-date-with-sns-sqs/ + AuthorName: Frederico Liporace + Tools & Applications: + - Title: STAC V0.7 search endpoint for archive + URL: https://stac.amskepler.com/v07/stac/search + AuthorName: AMS Kepler + AuthorURL: https://github.com/fredliporace/cbers-2-stac + - Title: Remote Pixel Viewer + URL: https://viewer.remotepixel.ca + AuthorName: Remote Pixel + AuthorURL: http://remotepixel.ca/ + - Title: EOS Land Viewer + URL: https://eos.com/landviewer/ + AuthorName: Earth Observing System + AuthorURL: https://eos.com/ + - Title: CBERS timelapse GIF generator + URL: https://github.com/fredliporace/cbersgif + AuthorName: Frederico Liporace + AuthorURL: https://github.com/fredliporace + - Title: aws-sat-api-py + URL: https://github.com/RemotePixel/aws-sat-api-py + AuthorName: Remote Pixel + AuthorURL: http://remotepixel.ca/ + - Title: rio-tiler + URL: https://github.com/mapbox/rio-tiler + AuthorName: Mapbox + AuthorURL: https://www.mapbox.com/ + - Title: cbers-tiler + URL: https://github.com/mapbox/cbers-tiler + AuthorName: Mapbox + AuthorURL: https://www.mapbox.com/ + - Title: CBERS static STAC catalog served by stac-browser + URL: https://cbers.stac.cloud + AuthorName: Radiant Earth + AuthorURL: https://github.com/radiantearth/stac-browser + Publications: diff --git a/datasets/cell-painting-image-collection.yaml b/datasets/cell-painting-image-collection.yaml index 9a9ec1426..a0574992a 100644 --- a/datasets/cell-painting-image-collection.yaml +++ b/datasets/cell-painting-image-collection.yaml @@ -31,7 +31,10 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Example submission for the 2018 CytoData Hackathon 
(in R and Python) - URL: https://github.com/cytodata/cytodata-hackathon-2018/tree/master/cytodata-toolkit/ - AuthorName: Juan Caicedo, Tim Becker - AuthorURL: broadinstitute.org + Tutorials: + Tools & Applications: + Publications: + - Title: Example submission for the 2018 CytoData Hackathon (in R and Python) + URL: https://github.com/cytodata/cytodata-hackathon-2018/tree/master/cytodata-toolkit/ + AuthorName: Juan Caicedo, Tim Becker + AuthorURL: https://www.broadinstitute.org diff --git a/datasets/census-dataworld-pums.yaml b/datasets/census-dataworld-pums.yaml index dd00f699f..bebdc2725 100644 --- a/datasets/census-dataworld-pums.yaml +++ b/datasets/census-dataworld-pums.yaml @@ -16,7 +16,10 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Setting up Blazegraph on EC2 - URL: https://docs.data.world/uscensus/#50---getting-started - AuthorName: data.world - AuthorURL: https://data.world/ + Tutorials: + - Title: Setting up Blazegraph on EC2 + URL: https://docs.data.world/uscensus/#50---getting-started + AuthorName: data.world + AuthorURL: https://data.world/ + Tools & Applications: + Publications: diff --git a/datasets/cgiardata.yaml b/datasets/cgiardata.yaml index 4c3882d08..98ae9d050 100644 --- a/datasets/cgiardata.yaml +++ b/datasets/cgiardata.yaml @@ -14,4 +14,8 @@ Resources: - Description: ARC GRID, and ARC ASCII format compressed ARN: arn:aws:s3:::cgiardata Region: us-west-2 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/commoncrawl.yaml b/datasets/commoncrawl.yaml index 228f79c17..92f6f504f 100644 --- a/datasets/commoncrawl.yaml +++ b/datasets/commoncrawl.yaml @@ -17,41 +17,44 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Dresden Web Table Corpus (DWTC) - URL: https://wwwdb.inf.tu-dresden.de/research-projects/dresden-web-table-corpus/ - AuthorName: Database Systems Group Dresden - AuthorURL: 
https://wwwdb.inf.tu-dresden.de/ - - Title: Building a Web-Scale Dependency-Parsed Corpus from CommonCrawl - URL: https://arxiv.org/pdf/1710.01779.pdf - AuthorName: Alexander Panchenko, et al. - - Title: Index to WARC Files and URLs in Columnar Format - URL: http://commoncrawl.org/2018/03/index-to-warc-files-and-urls-in-columnar-format/ - AuthorName: Sebastian Nagel - - Title: Learning word vectors for 157 languages - URL: https://arxiv.org/abs/1802.06893 - AuthorName: Facebook AI Research - AuthorURL: https://fasttext.cc/docs/en/crawl-vectors.html - - Title: Using open data to predict market movements - URL: https://education.emc.com/content/dam/dell-emc/documents/en-us/2017KS_Ravinder-Using_Open_Data_to_Predict_Market_Movements.pdf - AuthorName: DELL EMC - - Title: N-gram counts and language models from the Common Crawl - URL: http://www.lrec-conf.org/proceedings/lrec2014/pdf/1097_Paper.pdf - AuthorName: Christian Buck, Kenneth Heafield, Bas van Ooyen - AuthorURL: http://statmt.org/ngrams/ - - Title: Large-scale analysis of style injection by relative path overwrite - URL: https://doi.org/10.1145/3178876.3186090 - AuthorName: Sajjad Arshad, et al. 
- - Title: Web Data Commons - RDFa, microdata, and microformat data sets - URL: http://webdatacommons.org/structureddata/ - AuthorName: Christian Bizer, Robert Meusel, Anna Primpeli - - Title: "C4Corpus: Multilingual Web-Size Corpus with Free License" - URL: http://www.lrec-conf.org/proceedings/lrec2016/pdf/388_Paper.pdf - AuthorName: Ivan Habernal, Omnia Zayed, Iryna Gurevych - AuthorURL: https://dkpro.github.io/dkpro-c4corpus/ - - Title: Of using Common Crawl to play Family Feud - URL: https://fulmicoton.com/posts/commoncrawl/ - AuthorName: Paul Masurel - - Title: Large-scale graph mining with Spark - URL: https://towardsdatascience.com/large-scale-graph-mining-with-spark-750995050656 - AuthorName: Win Suen - AuthorURL: https://github.com/wsuen/pygotham2018_graphmining + Tutorials: + - Title: Large-scale graph mining with Spark + URL: https://towardsdatascience.com/large-scale-graph-mining-with-spark-750995050656 + AuthorName: Win Suen + AuthorURL: https://github.com/wsuen/pygotham2018_graphmining + - Title: Learning word vectors for 157 languages + URL: https://arxiv.org/abs/1802.06893 + AuthorName: Facebook AI Research + AuthorURL: https://fasttext.cc/docs/en/crawl-vectors.html + Tools & Applications: + - Title: Dresden Web Table Corpus (DWTC) + URL: https://wwwdb.inf.tu-dresden.de/research-projects/dresden-web-table-corpus/ + AuthorName: Database Systems Group Dresden + AuthorURL: https://wwwdb.inf.tu-dresden.de/ + - Title: Index to WARC Files and URLs in Columnar Format + URL: http://commoncrawl.org/2018/03/index-to-warc-files-and-urls-in-columnar-format/ + AuthorName: Sebastian Nagel + Publications: + - Title: Building a Web-Scale Dependency-Parsed Corpus from CommonCrawl + URL: https://arxiv.org/pdf/1710.01779.pdf + AuthorName: Alexander Panchenko, et al. 
+ - Title: Using open data to predict market movements + URL: https://education.emc.com/content/dam/dell-emc/documents/en-us/2017KS_Ravinder-Using_Open_Data_to_Predict_Market_Movements.pdf + AuthorName: DELL EMC + - Title: N-gram counts and language models from the Common Crawl + URL: http://www.lrec-conf.org/proceedings/lrec2014/pdf/1097_Paper.pdf + AuthorName: Christian Buck, Kenneth Heafield, Bas van Ooyen + AuthorURL: http://statmt.org/ngrams/ + - Title: Large-scale analysis of style injection by relative path overwrite + URL: https://doi.org/10.1145/3178876.3186090 + AuthorName: Sajjad Arshad, et al. + - Title: Web Data Commons - RDFa, microdata, and microformat data sets + URL: http://webdatacommons.org/structureddata/ + AuthorName: Christian Bizer, Robert Meusel, Anna Primpeli + - Title: "C4Corpus: Multilingual Web-Size Corpus with Free License" + URL: http://www.lrec-conf.org/proceedings/lrec2016/pdf/388_Paper.pdf + AuthorName: Ivan Habernal, Omnia Zayed, Iryna Gurevych + AuthorURL: https://dkpro.github.io/dkpro-c4corpus/ + - Title: Of using Common Crawl to play Family Feud + URL: https://fulmicoton.com/posts/commoncrawl/ + AuthorName: Paul Masurel diff --git a/datasets/cornell-eas-data-lake.yaml b/datasets/cornell-eas-data-lake.yaml index b63e17405..9466e3a73 100644 --- a/datasets/cornell-eas-data-lake.yaml +++ b/datasets/cornell-eas-data-lake.yaml @@ -1,16 +1,16 @@ Name: 'Cornell EAS Data Lake' Description: > - Earth & Atmospheric Sciences at Cornell University has created a public data - lake of climate data. The data is stored in columnar storage formats (ORC) to - make it straightforward to query using standard tools like Amazon - Athena or Apache Spark. The data itself is originally intended to be used for - building decision support tools for farmers and digital agriculture. The first - dataset is the historical NDFD / NDGD data distributed by NCEP / NOAA / NWS. 
- The NDFD (National Digital Forecast Database) and NDGD (National Digital Guidance Database) - contain gridded forecasts and observations at 2.5km resolution for the Contiguous - United States (CONUS). There are also 5km grids for several smaller US regions and - non-continguous territories, such as Hawaii, Guam, Puerto Rico and Alaska. NOAA - distributes archives of the NDFD/NDGD via its NOAA Operational Model Archive and Distribution System (NOMADS) + Earth & Atmospheric Sciences at Cornell University has created a public data + lake of climate data. The data is stored in columnar storage formats (ORC) to + make it straightforward to query using standard tools like Amazon + Athena or Apache Spark. The data itself is originally intended to be used for + building decision support tools for farmers and digital agriculture. The first + dataset is the historical NDFD / NDGD data distributed by NCEP / NOAA / NWS. + The NDFD (National Digital Forecast Database) and NDGD (National Digital Guidance Database) + contain gridded forecasts and observations at 2.5km resolution for the Contiguous + United States (CONUS). There are also 5km grids for several smaller US regions and + non-contiguous territories, such as Hawaii, Guam, Puerto Rico and Alaska. NOAA + distributes archives of the NDFD/NDGD via its NOAA Operational Model Archive and Distribution System (NOMADS) in Grib2 format. The data has been converted to ORC to optimize storage space and to, more importantly, simplify data access via standard data analytics tools. @@ -41,14 +41,17 @@ Resources: ARN: arn:aws:sns:us-east-2:003709786761:cornell-eas-data-lake-human Region: us-east-2 Type: SNS Topic - + - Description: 'Cornell EAS Data Lake Automation Notifications. Used to send JSON notifications to automated build pipelines and ETL jobs when the EAS Data Lake is updated.' 
ARN: arn:aws:sns:us-east-2:003709786761:cornell-eas-data-lake Region: us-east-2 Type: SNS Topic - + DataAtWork: - - Title: Cornell EAS Data Lake Setup Tutorial - URL: https://datalake.eas.cornell.edu/tutorial.html - AuthorName: Marty Sullivan - AuthorURL: http://martysullivan.com + Tutorials: + - Title: Cornell EAS Data Lake Setup Tutorial + URL: https://datalake.eas.cornell.edu/tutorial.html + AuthorName: Marty Sullivan + AuthorURL: http://martysullivan.com + Tools & Applications: + Publications: diff --git a/datasets/cosmo-d2-eps.yaml b/datasets/cosmo-d2-eps.yaml index 813364541..a67dc8486 100644 --- a/datasets/cosmo-d2-eps.yaml +++ b/datasets/cosmo-d2-eps.yaml @@ -21,4 +21,8 @@ Resources: ARN: arn:aws:s3:::dwd-cosmo-d2-eps-pds Region: eu-central-1 Type: S3 Bucket - +DataAtWork: + Tutorials: + Tools & Applications: + Publications: + diff --git a/datasets/cse-cic-ids2018.yaml b/datasets/cse-cic-ids2018.yaml index dcecc5369..38b72d0e2 100644 --- a/datasets/cse-cic-ids2018.yaml +++ b/datasets/cse-cic-ids2018.yaml @@ -18,3 +18,7 @@ Resources: ARN: arn:aws:s3:::cse-cic-ids2018 Region: ca-central-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/daily-coin-data.yaml b/datasets/daily-coin-data.yaml deleted file mode 100644 index b1b1734c0..000000000 --- a/datasets/daily-coin-data.yaml +++ /dev/null @@ -1,24 +0,0 @@ -Name: Collection of daily coin data from Coin Metrics -Description: | - This project is set to pull the latest daily coin data from Coin Metrics using the data.world sync applet on IFTTT. - Daily on-chain transaction volume is calculated as the sum of all transaction outputs belonging to the blocks mined on the given day. "Change" outputs are not included. - Transaction count figure doesn’t include coinbase transactions. 
-Documentation: https://data.world/scuttlemonkey/coin-metrics -Contact: https://data.world/scuttlemonkey/coin-metrics/discuss -UpdateFrequency: Daily -Tags: - - financial markets - - economics - - bitcoin - - blockchain -License: MIT License -Resources: - - Description: Project data files - ARN: arn:aws:s3:::dataworld-odaws-us-east-1/datasets/scuttlemonkey/coin-metrics/ - Region: us-east-1 - Type: S3 Bucket -DataAtWork: - - Title: Collection of daily coin data from Coin Metrics. - URL: https://data.world/scuttlemonkey/coin-metrics - AuthorName: "@scuttlemonkey on data.world" - AuthorURL: https://data.world/scuttlemonkey diff --git a/datasets/dataforgood-fb-hrsl.yaml b/datasets/dataforgood-fb-hrsl.yaml index 3ce759443..f6b776432 100644 --- a/datasets/dataforgood-fb-hrsl.yaml +++ b/datasets/dataforgood-fb-hrsl.yaml @@ -4,7 +4,7 @@ Description: | and Cloud-optimized GeoTIFF files. This refines [CIESIN’s Gridded Population of the World](https://sedac.ciesin.columbia.edu/data/collection/gpw-v4) using machine learning models on high-resolution worldwide Digital Globe satellite imagery. CIESIN population counts aggregated from worldwide census - data are allocated to blocks where imagery appears to contain buildings. + data are allocated to blocks where imagery appears to contain buildings. Documentation: "[Project overview](https://dataforgood.fb.com/population-density-maps-documentation/) and [dataset description](https://docs.opendata.aws/dataforgood-fb-data/readme.html)" Contact: disastermaps@fb.com ManagedBy: | @@ -31,7 +31,11 @@ License: | Settlement Layer (HRSL). Source imagery for HRSL © 2016 [DigitalGlobe](http://explore.digitalglobe.com/Basemap-Vivid.html). Accessed DAY MONTH YEAR. 
Resources: - - Description: CSV and Cloud-optimized GeoTIFF files + - Description: CSV and Cloud-optimized GeoTIFF files ARN: arn:aws:s3:::dataforgood-fb-data Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/dc-lidar-2015.yaml b/datasets/dc-lidar-2015.yaml index 37f328270..ac2bafe90 100644 --- a/datasets/dc-lidar-2015.yaml +++ b/datasets/dc-lidar-2015.yaml @@ -25,3 +25,7 @@ Resources: ARN: arn:aws:s3:::dc-lidar-2018 Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/dc-lidar.yaml b/datasets/dc-lidar.yaml index d78927728..3c328993e 100644 --- a/datasets/dc-lidar.yaml +++ b/datasets/dc-lidar.yaml @@ -23,3 +23,7 @@ Resources: ARN: arn:aws:s3:::dc-lidar-2018 Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/deutsche-boerse-pds.yaml b/datasets/deutsche-boerse-pds.yaml index 533047764..599fa65a1 100644 --- a/datasets/deutsche-boerse-pds.yaml +++ b/datasets/deutsche-boerse-pds.yaml @@ -19,15 +19,18 @@ Resources: Region: eu-central-1 Type: S3 Bucket DataAtWork: - - Title: "Stock Price Movement Prediction Using The Deutsche Börse Public Dataset & Machine Learning" - URL: https://github.com/Originate/dbg-pds-tensorflow-demo - AuthorName: Originate - AuthorURL: https://www.originate.com - - Title: 10 visualizations to try in Amazon QuickSight with sample data - URL: https://aws.amazon.com/blogs/big-data/10-visualizations-to-try-in-amazon-quicksight-with-sample-data/ - AuthorName: AWS Big Data Blog - AuthorURL: https://aws.amazon.com/blogs/big-data/ - - Title: Streaming XETRA Data Using Apache Spark - URL: http://live.thermobook.net/dataStreamingWeb - AuthorName: Thermobook - AuthorURL: http://www.thermobook.net + Tutorials: + - Title: "Stock Price Movement Prediction Using The 
Deutsche Börse Public Dataset & Machine Learning" + URL: https://github.com/Originate/dbg-pds-tensorflow-demo + AuthorName: Originate + AuthorURL: https://www.originate.com + - Title: 10 visualizations to try in Amazon QuickSight with sample data + URL: https://aws.amazon.com/blogs/big-data/10-visualizations-to-try-in-amazon-quicksight-with-sample-data/ + AuthorName: AWS Big Data Blog + AuthorURL: https://aws.amazon.com/blogs/big-data/ + Tools & Applications: + - Title: Streaming XETRA Data Using Apache Spark + URL: http://live.thermobook.net/dataStreamingWeb + AuthorName: Thermobook + AuthorURL: http://www.thermobook.net + Publications: diff --git a/datasets/digital-globe-open-data.yaml b/datasets/digital-globe-open-data.yaml index b9d2a2b5e..d20c10b97 100644 --- a/datasets/digital-globe-open-data.yaml +++ b/datasets/digital-globe-open-data.yaml @@ -17,3 +17,7 @@ Resources: Host: opendata.digitalglobe.com Region: us-east-1 Type: CloudFront Distribution +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/dwd-cosmo-d2-pds.yaml b/datasets/dwd-cosmo-d2-pds.yaml index 6db341fc7..3aaaaba29 100644 --- a/datasets/dwd-cosmo-d2-pds.yaml +++ b/datasets/dwd-cosmo-d2-pds.yaml @@ -21,3 +21,7 @@ Resources: ARN: arn:aws:s3:::dwd-cosmo-d2-pds Region: eu-central-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/dwd-icon-eu-pds.yaml b/datasets/dwd-icon-eu-pds.yaml index 790e3f346..dae78f69f 100644 --- a/datasets/dwd-icon-eu-pds.yaml +++ b/datasets/dwd-icon-eu-pds.yaml @@ -20,4 +20,8 @@ Resources: - Description: model output in GRIB2 data format for commonly used parameters ARN: arn:aws:s3:::dwd-icon-eu-pds Region: eu-central-1 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/dwd-icon-global-pds.yaml 
b/datasets/dwd-icon-global-pds.yaml index b4688ca17..e341263ff 100644 --- a/datasets/dwd-icon-global-pds.yaml +++ b/datasets/dwd-icon-global-pds.yaml @@ -20,4 +20,8 @@ Resources: - Description: model output in GRIB2 data format for commonly used parameters ARN: arn:aws:s3:::dwd-icon-global-pds Region: eu-central-1 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/ebirdst.yaml b/datasets/ebirdst.yaml index 63f5d354a..44fd6f7a3 100644 --- a/datasets/ebirdst.yaml +++ b/datasets/ebirdst.yaml @@ -1,9 +1,9 @@ Name: eBird Status and Trends Model Results Description: | - The eBird Status and Trends project generates estimates of bird - occurrence and abundance at a high spatiotemporal resolution. + The eBird Status and Trends project generates estimates of bird + occurrence and abundance at a high spatiotemporal resolution. This dataset represents the primary modeled results from the - analysis workflow and are designed for further analysis, + analysis workflow and are designed for further analysis, synthesis, visualization, and exploration. 
Documentation: https://cornelllabofornithology.github.io/ebirdst/articles/ebirdst-introduction.html Contact: https://help.ebird.org/customer/en/portal/emails/new @@ -25,24 +25,27 @@ Resources: Region: us-west-2 Type: S3 Bucket DataAtWork: - - Title: eBird Status and Trends Visualizations - URL: https://ebird.org/science/status-and-trends - AuthorName: Cornell Lab of Ornithology - - Title: ebirdst R Package - URL: https://cornelllabofornithology.github.io/ebirdst/ - AuthorName: Cornell Lab of Ornithology - - Title: ebirdst - Background, Data Access and Data Structure - URL: https://cornelllabofornithology.github.io/ebirdst/articles/ebirdst-introduction.html - AuthorName: Tom Auer and Daniel Fink - - Title: ebirdst - Intro Mapping - URL: https://cornelllabofornithology.github.io/ebirdst/articles/ebirdst-intro-mapping.html - AuthorName: Tom Auer and Daniel Fink - - Title: ebirdst - Generating Seasonal Abundance and Range Maps and Stats - URL: https://cornelllabofornithology.github.io/ebirdst/articles/ebirdst-advanced-mapping.html - AuthorName: Matt Strimas-Mackey, Tom Auer, and Daniel Fink - - Title: ebirdst - Non-raster Data - URL: https://cornelllabofornithology.github.io/ebirdst/articles/ebirdst-non-raster.html - AuthorName: Tom Auer and Daniel Fink - - Title: eBird Status and Trends FAQ - URL: https://ebird.org/science/status-and-trends/faq - AuthorName: Cornell Lab of Ornithology + Tutorials: + - Title: eBird Status and Trends Visualizations + URL: https://ebird.org/science/status-and-trends + AuthorName: Cornell Lab of Ornithology + - Title: ebirdst - Background, Data Access and Data Structure + URL: https://cornelllabofornithology.github.io/ebirdst/articles/ebirdst-introduction.html + AuthorName: Tom Auer and Daniel Fink + - Title: ebirdst - Intro Mapping + URL: https://cornelllabofornithology.github.io/ebirdst/articles/ebirdst-intro-mapping.html + AuthorName: Tom Auer and Daniel Fink + - Title: ebirdst - Generating Seasonal Abundance and Range Maps and Stats + 
URL: https://cornelllabofornithology.github.io/ebirdst/articles/ebirdst-advanced-mapping.html + AuthorName: Matt Strimas-Mackey, Tom Auer, and Daniel Fink + - Title: ebirdst - Non-raster Data + URL: https://cornelllabofornithology.github.io/ebirdst/articles/ebirdst-non-raster.html + AuthorName: Tom Auer and Daniel Fink + - Title: eBird Status and Trends FAQ + URL: https://ebird.org/science/status-and-trends/faq + AuthorName: Cornell Lab of Ornithology + Tools & Applications: + - Title: ebirdst R Package + URL: https://cornelllabofornithology.github.io/ebirdst/ + AuthorName: Cornell Lab of Ornithology + Publications: diff --git a/datasets/ecmwf-era5.yaml b/datasets/ecmwf-era5.yaml index 7ab5edc0d..11a1e2c13 100644 --- a/datasets/ecmwf-era5.yaml +++ b/datasets/ecmwf-era5.yaml @@ -21,11 +21,14 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Accessing ERA5 Data on S3 Using Boto - URL: https://github.com/planet-os/notebooks/blob/master/aws/era5-s3-via-boto.ipynb - AuthorName: Intertrust Technologies Corporation - AuthorURL: https://www.intertrust.com/ - - Title: ERA5 tutorial using the Planet OS API - URL: https://github.com/planet-os/notebooks/blob/master/api-examples/ERA5_tutorial.ipynb - AuthorName: Intertrust Technologies Corporation - AuthorURL: https://www.intertrust.com/ + Tutorials: + - Title: Accessing ERA5 Data on S3 Using Boto + URL: https://github.com/planet-os/notebooks/blob/master/aws/era5-s3-via-boto.ipynb + AuthorName: Intertrust Technologies Corporation + AuthorURL: https://www.intertrust.com/ + - Title: ERA5 tutorial using the Planet OS API + URL: https://github.com/planet-os/notebooks/blob/master/api-examples/ERA5_tutorial.ipynb + AuthorName: Intertrust Technologies Corporation + AuthorURL: https://www.intertrust.com/ + Tools & Applications: + Publications: diff --git a/datasets/encode-project.yaml b/datasets/encode-project.yaml index dbb144609..a7e9b2c72 100644 --- a/datasets/encode-project.yaml +++ 
b/datasets/encode-project.yaml @@ -32,15 +32,18 @@ Resources: Region: us-west-2 Type: S3 Bucket DataAtWork: - - Title: Exploring ENCODE data from EC2 with Jupyter notebook - URL: https://github.com/ENCODE-DCC/encode-data-usage-examples/blob/master/mount_s3_bucket_and_run_jupyter_on_ec2.ipynb - AuthorName: Keenan Graham - AuthorURL: https://github.com/keenangraham - - Title: ENCODE CTCF ChIP-seq data correlation across different cell types - URL: https://github.com/ENCODE-DCC/encode-data-usage-examples/blob/master/ctcf_chip_seq_cross_cell_type_correlation.ipynb - AuthorName: Paul Sud - AuthorURL: https://github.com/p-sud - - Title: Ingesting ENCODE data into TileDB with S3 backend - URL: https://github.com/ENCODE-DCC/encode-data-usage-examples/blob/master/ingest_encode_data_tile_db_with_s3_backend.ipynb - AuthorName: Otto Jolanki - AuthorURL: https://github.com/ottojolanki + Tutorials: + - Title: Exploring ENCODE data from EC2 with Jupyter notebook + URL: https://github.com/ENCODE-DCC/encode-data-usage-examples/blob/master/mount_s3_bucket_and_run_jupyter_on_ec2.ipynb + AuthorName: Keenan Graham + AuthorURL: https://github.com/keenangraham + - Title: ENCODE CTCF ChIP-seq data correlation across different cell types + URL: https://github.com/ENCODE-DCC/encode-data-usage-examples/blob/master/ctcf_chip_seq_cross_cell_type_correlation.ipynb + AuthorName: Paul Sud + AuthorURL: https://github.com/p-sud + - Title: Ingesting ENCODE data into TileDB with S3 backend + URL: https://github.com/ENCODE-DCC/encode-data-usage-examples/blob/master/ingest_encode_data_tile_db_with_s3_backend.ipynb + AuthorName: Otto Jolanki + AuthorURL: https://github.com/ottojolanki + Tools & Applications: + Publications: diff --git a/datasets/epa-rsei-pds.yaml b/datasets/epa-rsei-pds.yaml index e7c436441..fe411f9ff 100644 --- a/datasets/epa-rsei-pds.yaml +++ b/datasets/epa-rsei-pds.yaml @@ -13,3 +13,7 @@ Resources: ARN: arn:aws:s3:::epa-rsei-pds Region: us-east-1 Type: S3 Bucket +DataAtWork: + 
Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/epoch-of-reionization.yaml b/datasets/epoch-of-reionization.yaml index f9ce5353e..4c27cc662 100644 --- a/datasets/epoch-of-reionization.yaml +++ b/datasets/epoch-of-reionization.yaml @@ -21,3 +21,7 @@ Resources: ARN: arn:aws:s3:::mwapublic Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/fast-ai-coco.yaml b/datasets/fast-ai-coco.yaml index 9bc017da2..af10cb11f 100644 --- a/datasets/fast-ai-coco.yaml +++ b/datasets/fast-ai-coco.yaml @@ -19,4 +19,7 @@ Resources: ARN: arn:aws:s3:::fast-ai-coco Region: us-east-1 Type: S3 Bucket - +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/fast-ai-imageclas.yaml b/datasets/fast-ai-imageclas.yaml index 4dd0b1492..5f2ffcc22 100644 --- a/datasets/fast-ai-imageclas.yaml +++ b/datasets/fast-ai-imageclas.yaml @@ -20,4 +20,7 @@ Resources: ARN: arn:aws:s3:::fast-ai-imageclas Region: us-east-1 Type: S3 Bucket - +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/fast-ai-imagelocal.yaml b/datasets/fast-ai-imagelocal.yaml index b052cd4d2..b944a0c53 100644 --- a/datasets/fast-ai-imagelocal.yaml +++ b/datasets/fast-ai-imagelocal.yaml @@ -19,4 +19,7 @@ Resources: ARN: arn:aws:s3:::fast-ai-imagelocal Region: us-east-1 Type: S3 Bucket - +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/fast-ai-nlp.yaml b/datasets/fast-ai-nlp.yaml index 7664cb236..daed7df46 100644 --- a/datasets/fast-ai-nlp.yaml +++ b/datasets/fast-ai-nlp.yaml @@ -22,4 +22,7 @@ Resources: ARN: arn:aws:s3:::fast-ai-nlp Region: us-east-1 Type: S3 Bucket - +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/federal-government-awards.yaml b/datasets/federal-government-awards.yaml deleted file mode 100644 index 8f374a564..000000000 --- 
a/datasets/federal-government-awards.yaml +++ /dev/null @@ -1,22 +0,0 @@ -Name: Federal Government Awards -Description: | - The Federal Awards dataset contains a complete export of the data available from USASpending. This dataset reflects all observations submitted through the third quarter of fiscal year 2017. -Documentation: https://data.world/usaspending/federal-government-awards-in-q-2 -Contact: https://data.world/usaspending/federal-government-awards-in-q-2/discuss -UpdateFrequency: Quarterly -Tags: - - census - - government spending - - regulatory - - us -License: CC-0 -Resources: - - Description: Project data files - ARN: arn:aws:s3:::dataworld-odaws-us-east-1/datasets/usaspending/federal-government-awards-in-q-2/ - Region: us-east-1 - Type: S3 Bucket -DataAtWork: - - Title: Federal government awards data - URL: https://data.world/usaspending/federal-government-awards-in-q-2 - AuthorName: U.S. Department of Treasury @usaspending on data.world - AuthorURL: https://data.world/usaspending diff --git a/datasets/gatk-test-data.yaml b/datasets/gatk-test-data.yaml index 017c44843..18c8ae185 100644 --- a/datasets/gatk-test-data.yaml +++ b/datasets/gatk-test-data.yaml @@ -20,7 +20,10 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Genomics Workflows on AWS - Cromwell on AWS - URL: https://docs.opendata.aws/genomics-workflows/orchestration/cromwell/cromwell-examples/#real-world-example-haplotypecaller - AuthorName: W. Lee Pang - AuthorURL: https://www.linkedin.com/in/lee-pang-a039a26/ + Tutorials: + Tools & Applications: + - Title: Genomics Workflows on AWS - Cromwell on AWS + URL: https://docs.opendata.aws/genomics-workflows/orchestration/cromwell/cromwell-examples/#real-world-example-haplotypecaller + AuthorName: W. 
Lee Pang + AuthorURL: https://www.linkedin.com/in/lee-pang-a039a26/ + Publications: diff --git a/datasets/gdelt.yaml b/datasets/gdelt.yaml index 9c0f1eb4d..f25fc6725 100644 --- a/datasets/gdelt.yaml +++ b/datasets/gdelt.yaml @@ -24,27 +24,30 @@ Resources: Region: us-east-1 Type: SNS Topic DataAtWork: - - Title: Exploring GDELT with Athena - URL: http://blog.julien.org/2017/03/exploring-gdelt-data-set-with-amazon.html - AuthorName: Julien Simon - AuthorURL: https://twitter.com/julsimon - - Title: Running R on Amazon Athena - URL: https://aws.amazon.com/blogs/big-data/running-r-on-amazon-athena/ - AuthorName: Gopal Wunnava - AuthorURL: https://www.linkedin.com/in/gopal-wunnava-b11a77/ - - Title: Bootstrapping GeoMesa HBase on AWS S3 - URL: http://www.geomesa.org/documentation/tutorials/geomesa-hbase-s3-on-aws.html - AuthorName: Commonwealth Computer Research, Inc. - AuthorURL: https://www.ccri.com - - Title: Creating PySpark DataFrame from CSV in AWS S3 in EMR - URL: https://gist.github.com/jakechen/6955f2de51212163312b6430555b8e0b - AuthorName: Jake Chen - AuthorURL: https://github.com/jakechen - - Title: Globe Events - URL: http://live.thermobook.net/globe-events/ - AuthorName: thermobook - AuthorURL: http://www.thermobook.net - - Title: Analysing Brexit Coverage In The Media Over Time - URL: https://www.linkedin.com/pulse/media-brexit-story-so-far-may-corbyn-less-shambles-than-mark-chopping/ - AuthorName: Mark Chopping - AuthorURL: https://www.kognitio.com + Tutorials: + - Title: Exploring GDELT with Athena + URL: http://blog.julien.org/2017/03/exploring-gdelt-data-set-with-amazon.html + AuthorName: Julien Simon + AuthorURL: https://twitter.com/julsimon + - Title: Running R on Amazon Athena + URL: https://aws.amazon.com/blogs/big-data/running-r-on-amazon-athena/ + AuthorName: Gopal Wunnava + AuthorURL: https://www.linkedin.com/in/gopal-wunnava-b11a77/ + - Title: Bootstrapping GeoMesa HBase on AWS S3 + URL: 
http://www.geomesa.org/documentation/tutorials/geomesa-hbase-s3-on-aws.html + AuthorName: Commonwealth Computer Research, Inc. + AuthorURL: https://www.ccri.com + - Title: Creating PySpark DataFrame from CSV in AWS S3 in EMR + URL: https://gist.github.com/jakechen/6955f2de51212163312b6430555b8e0b + AuthorName: Jake Chen + AuthorURL: https://github.com/jakechen + - Title: Analysing Brexit Coverage In The Media Over Time + URL: https://www.linkedin.com/pulse/media-brexit-story-so-far-may-corbyn-less-shambles-than-mark-chopping/ + AuthorName: Mark Chopping + AuthorURL: https://www.kognitio.com + Tools & Applications: + - Title: Globe Events + URL: http://live.thermobook.net/globe-events/ + AuthorName: thermobook + AuthorURL: http://www.thermobook.net + Publications: \ No newline at end of file diff --git a/datasets/genomeark.yaml b/datasets/genomeark.yaml index 1b432755c..ce3b6eae9 100644 --- a/datasets/genomeark.yaml +++ b/datasets/genomeark.yaml @@ -17,3 +17,7 @@ Resources: ARN: arn:aws:s3:::genomeark Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/geoschem-input-data.yaml b/datasets/geoschem-input-data.yaml index 00764055e..4fc193f33 100644 --- a/datasets/geoschem-input-data.yaml +++ b/datasets/geoschem-input-data.yaml @@ -18,15 +18,18 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Tutorial on accessing GEOS-Chem data bucket in S3 - URL: http://cloud-gc.readthedocs.io/en/stable/chapter02_beginner-tutorial/use-s3.html#access-geos-chem-input-data-repository-in-s3 - AuthorName: Jiawei Zhuang - AuthorURL: https://github.com/JiaweiZhuang - - Title: Overview of the GEOSChem-on-cloud project - URL: http://acmg.seas.harvard.edu/research.html#cloud - AuthorName: Atmospheric Chemistry Modeling Group, Harvard University - AuthorURL: http://acmg.seas.harvard.edu/index.html - - Title: Running GEOS-Chem on Cloud Computing Platforms, presented at the 8th 
International GEOS-Chem Meeting - URL: http://acmg.seas.harvard.edu/presentations/IGC8/posters/Mon_Posters_Zhuang_Jiawei.pdf - AuthorName: Jiawei Zhuang, et al. - AuthorURL: https://github.com/JiaweiZhuang + Tutorials: + - Title: Tutorial on accessing GEOS-Chem data bucket in S3 + URL: http://cloud-gc.readthedocs.io/en/stable/chapter02_beginner-tutorial/use-s3.html#access-geos-chem-input-data-repository-in-s3 + AuthorName: Jiawei Zhuang + AuthorURL: https://github.com/JiaweiZhuang + Tools & Applications: + Publications: + - Title: Overview of the GEOSChem-on-cloud project + URL: http://acmg.seas.harvard.edu/research.html#cloud + AuthorName: Atmospheric Chemistry Modeling Group, Harvard University + AuthorURL: http://acmg.seas.harvard.edu/index.html + - Title: Running GEOS-Chem on Cloud Computing Platforms, presented at the 8th International GEOS-Chem Meeting + URL: http://acmg.seas.harvard.edu/presentations/IGC8/posters/Mon_Posters_Zhuang_Jiawei.pdf + AuthorName: Jiawei Zhuang, et al. + AuthorURL: https://github.com/JiaweiZhuang diff --git a/datasets/giab.yaml b/datasets/giab.yaml index 74f185ee1..1922ecd12 100644 --- a/datasets/giab.yaml +++ b/datasets/giab.yaml @@ -8,9 +8,13 @@ Tags: - genomic - life sciences License: | - There are no restrictions on the use of this data. More information on citation is available [here](https://sites.stanford.edu/abms/content/giab-reference-materials-and-data). + There are no restrictions on the use of this data. More information on citation is available [here](https://www.nist.gov/programs-projects/genome-bottle). 
Resources: - Description: Latest data ARN: arn:aws:s3:::giab - Region: us-east-1 + Region: us-west-2 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/gmsdata.yaml b/datasets/gmsdata.yaml index e4afb2bb0..6dff0bc87 100644 --- a/datasets/gmsdata.yaml +++ b/datasets/gmsdata.yaml @@ -13,4 +13,8 @@ Resources: - Description: https://gmsdata.s3.amazonaws.com/INDEX.html ARN: arn:aws:s3:::gmsdata Region: us-west-2 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/google-ngrams.yaml b/datasets/google-ngrams.yaml index 38da72134..9891a6e31 100644 --- a/datasets/google-ngrams.yaml +++ b/datasets/google-ngrams.yaml @@ -11,4 +11,8 @@ Resources: - Description: A data set containing Google Books n-gram corpora in a Hadoop friendly file format. ARN: arn:aws:s3:::datasets.elasticmapreduce/ngrams/books/ Region: us-east-1 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/grillo-openeew.yaml b/datasets/grillo-openeew.yaml index a9169504a..b3dffdc36 100644 --- a/datasets/grillo-openeew.yaml +++ b/datasets/grillo-openeew.yaml @@ -22,11 +22,14 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: OpenEEW library for Python - URL: https://github.com/grillo/openeew-python - AuthorName: Grillo - AuthorURL: https://grillo.io/openeew/ - - Title: Analyzing a magnitude 7.2 earthquake in Mexico using Python - URL: https://blog.grillo.io/analyzing-a-magnitude-7-2-earthquake-in-mexico-using-python-6272a4ff63e3 - AuthorName: Grillo - AuthorURL: https://grillo.io/openeew/ + Tutorials: + - Title: Analyzing a magnitude 7.2 earthquake in Mexico using Python + URL: https://blog.grillo.io/analyzing-a-magnitude-7-2-earthquake-in-mexico-using-python-6272a4ff63e3 + AuthorName: 
Grillo + AuthorURL: https://grillo.io/openeew/ + Tools & Applications: + - Title: OpenEEW library for Python + URL: https://github.com/grillo/openeew-python + AuthorName: Grillo + AuthorURL: https://grillo.io/openeew/ + Publications: diff --git a/datasets/hcp-openaccess.yaml b/datasets/hcp-openaccess.yaml index 4299d7b1a..2c221e1f8 100644 --- a/datasets/hcp-openaccess.yaml +++ b/datasets/hcp-openaccess.yaml @@ -12,4 +12,8 @@ Resources: - Description: https://wiki.humanconnectome.org/display/PublicData/HCP+Data+Release+Updates%3A+Known+Issues+and+Planned+fixes ARN: arn:aws:s3:::hcp-openaccess Region: us-east-1 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/hirlam.yaml b/datasets/hirlam.yaml index cd0add6e3..341cb6062 100644 --- a/datasets/hirlam.yaml +++ b/datasets/hirlam.yaml @@ -27,4 +27,8 @@ Resources: - Description: Notifications for new pressure data ARN: arn:aws:sns:eu-west-1:916174725480:new-fmi-opendata-rcrhirlam-pressure-grib Region: eu-west-1 - Type: SNS Topic \ No newline at end of file + Type: SNS Topic +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/hpgp-data.yaml b/datasets/hpgp-data.yaml index 4388df96e..8dd5905aa 100644 --- a/datasets/hpgp-data.yaml +++ b/datasets/hpgp-data.yaml @@ -11,5 +11,9 @@ License: Human PanGenomics Project data are licensed under the Creative Commons Resources: - Description: Human PanGenomics Project ARN: arn:aws:s3:::human-pangenomics - Region: us-east-1 + Region: us-west-2 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/hst.yaml b/datasets/hst.yaml index 6da7b12d2..da0ce7f81 100644 --- a/datasets/hst.yaml +++ b/datasets/hst.yaml @@ -20,11 +20,14 @@ Resources: Region: us-east-1 Type: SNS Topic DataAtWork: - - Title: Making HST Public Data Available on AWS - URL: 
https://mast-labs.stsci.io/2018/06/hst-public-data-on-aws - AuthorName: Arfon Smith - AuthorURL: https://twitter.com/arfon - - Title: Exploring AWS Lambda with cloud-hosted Hubble public data - URL: https://mast-labs.stsci.io/2018/06/exploring-aws-lambda-with-hst-public-data - AuthorName: Arfon Smith - AuthorURL: https://twitter.com/arfon + Tutorials: + - Title: Exploring AWS Lambda with cloud-hosted Hubble public data + URL: https://mast-labs.stsci.io/2018/06/exploring-aws-lambda-with-hst-public-data + AuthorName: Arfon Smith + AuthorURL: https://twitter.com/arfon + Tools & Applications: + Publications: + - Title: Making HST Public Data Available on AWS + URL: https://mast-labs.stsci.io/2018/06/hst-public-data-on-aws + AuthorName: Arfon Smith + AuthorURL: https://twitter.com/arfon diff --git a/datasets/human-microbiome-project.yaml b/datasets/human-microbiome-project.yaml index d8740bf4f..997ced32b 100644 --- a/datasets/human-microbiome-project.yaml +++ b/datasets/human-microbiome-project.yaml @@ -11,4 +11,8 @@ Resources: - Description: https://aws.amazon.com/datasets/human-microbiome-project/ ARN: arn:aws:s3:::human-microbiome-project Region: us-west-2 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/icgc.yaml b/datasets/icgc.yaml index 764bd08d7..e760dac42 100644 --- a/datasets/icgc.yaml +++ b/datasets/icgc.yaml @@ -17,4 +17,8 @@ Resources: - Description: This public Amazon S3 bucket contains analysis metadata in XML format for genome analysis results. 
More information at http://oicr.icgc.meta.s3.amazonaws.com/metadata/README ARN: arn:aws:s3:::oicr.icgc.meta/metadata Region: us-east-1 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/ichangemycity.yaml b/datasets/ichangemycity.yaml index 69d4ee6db..bd081772e 100644 --- a/datasets/ichangemycity.yaml +++ b/datasets/ichangemycity.yaml @@ -15,3 +15,7 @@ Resources: ARN: arn:aws:s3:::ichangemycity-janaagraha-complaints-data-aws Region: ap-south-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/icon-eu-eps.yaml b/datasets/icon-eu-eps.yaml index f31d4072d..2de98fd97 100644 --- a/datasets/icon-eu-eps.yaml +++ b/datasets/icon-eu-eps.yaml @@ -4,7 +4,7 @@ Documentation: https://s3.eu-central-1.amazonaws.com/dwd-pds-help/dwd-icon-eu-pd Contact: opendata@dwd.de ManagedBy: "[Deutscher Wetterdienst](https://www.dwd.de/)" UpdateFrequency: Every 3 hours -Tags: +Tags: - aws-pds - climate - disaster response @@ -21,3 +21,7 @@ Resources: ARN: arn:aws:s3:::dwd-icon-eu-eps-pds Region: eu-central-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/icon-global-eps.yaml b/datasets/icon-global-eps.yaml index 5acefddc8..d01e9d373 100644 --- a/datasets/icon-global-eps.yaml +++ b/datasets/icon-global-eps.yaml @@ -21,4 +21,7 @@ Resources: ARN: arn:aws:s3:::dwd-icon-global-eps-pds Region: eu-central-1 Type: S3 Bucket - +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/irs990.yaml b/datasets/irs990.yaml index de5300730..029c38fe7 100644 --- a/datasets/irs990.yaml +++ b/datasets/irs990.yaml @@ -14,38 +14,41 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Parse 990 XML using IRSx - URL: https://github.com/jsfenfen/990-xml-reader - AuthorName: 
Jacob Fenton - AuthorURL: http://jacobfenton.com/ - - Title: aws-irs-990-explorer - URL: http://irs-990-explorer.chrisgherbert.com - AuthorName: Chris Herbert - AuthorURL: http://chrisgherbert.com/ - - Title: 990_long - URL: https://github.com/CharityNavigator/990_long - AuthorName: Charity Navigator - AuthorURL: https://www.charitynavigator.org/ - - Title: Non Profit Light - URL: http://nonprofitlight.com - AuthorName: Non Profit Light - - Title: Guide to Open Data for Nonprofit Research - URL: https://lecy.github.io/Open-Data-for-Nonprofit-Research/ - AuthorName: lecy - AuthorURL: https://github.com/lecy - - Title: Nonprofit Explorer - URL: https://projects.propublica.org/nonprofits/ - AuthorName: ProPublica - AuthorURL: https://propublica.org - - Title: Open990 - URL: https://www.open990.com/ - AuthorName: 990 Consulting, LLC - AuthorURL: https://www.990consulting.com/ - - Title: Tutorial on using the IRS 990 e-file dataset - URL: https://medium.com/@open990/the-irs-990-e-file-dataset-getting-to-the-chocolatey-center-of-data-deliciousness-90f66097a600 - AuthorName: 990 Consulting, LLC - AuthorURL: https://www.990consulting.com/ - - Title: Grantmakers.io - URL: https://www.grantmakers.io - AuthorName: Chad Kruse - AuthorURL: https://www.chadkruse.com/ + Tutorials: + - Title: Tutorial on using the IRS 990 e-file dataset + URL: https://medium.com/@open990/the-irs-990-e-file-dataset-getting-to-the-chocolatey-center-of-data-deliciousness-90f66097a600 + AuthorName: 990 Consulting, LLC + AuthorURL: https://www.990consulting.com/ + Tools & Applications: + - Title: Parse 990 XML using IRSx + URL: https://github.com/jsfenfen/990-xml-reader + AuthorName: Jacob Fenton + AuthorURL: http://jacobfenton.com/ + - Title: aws-irs-990-explorer + URL: http://irs-990-explorer.chrisgherbert.com + AuthorName: Chris Herbert + AuthorURL: http://chrisgherbert.com/ + - Title: 990_long + URL: https://github.com/CharityNavigator/990_long + AuthorName: Charity Navigator + AuthorURL: 
https://www.charitynavigator.org/ + - Title: Non Profit Light + URL: http://nonprofitlight.com + AuthorName: Non Profit Light + - Title: Guide to Open Data for Nonprofit Research + URL: https://lecy.github.io/Open-Data-for-Nonprofit-Research/ + AuthorName: lecy + AuthorURL: https://github.com/lecy + - Title: Nonprofit Explorer + URL: https://projects.propublica.org/nonprofits/ + AuthorName: ProPublica + AuthorURL: https://propublica.org + - Title: Open990 + URL: https://www.open990.com/ + AuthorName: 990 Consulting, LLC + AuthorURL: https://www.990consulting.com/ + - Title: Grantmakers.io + URL: https://www.grantmakers.io + AuthorName: Chad Kruse + AuthorURL: https://www.chadkruse.com/ + Publications: diff --git a/datasets/kitti.yaml b/datasets/kitti.yaml index 575536870..a820d7297 100644 --- a/datasets/kitti.yaml +++ b/datasets/kitti.yaml @@ -16,3 +16,7 @@ Resources: ARN: arn:aws:s3:::avg-kitti Region: eu-central-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/lab41-sri-voices.yaml b/datasets/lab41-sri-voices.yaml index c82c29d0f..bcd1e94e8 100644 --- a/datasets/lab41-sri-voices.yaml +++ b/datasets/lab41-sri-voices.yaml @@ -10,7 +10,7 @@ Description: | Documentation: https://voices18.github.io/ Contact: https://github.com/voices18/utilities/issues UpdateFrequency: Data from two additional rooms will be added to the corpus Fall 2018. -Tags: +Tags: - aws-pds - machine learning - automatic speech recognition @@ -24,6 +24,9 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Getting started with VOiCES data - URL: https://github.com/voices18/utilities/blob/master/Using%20VOiCES%20corpus%20tutorial.ipynb - AuthorName: M.A. Barrios + Tutorials: + - Title: Getting started with VOiCES data + URL: https://github.com/voices18/utilities/blob/master/Using%20VOiCES%20corpus%20tutorial.ipynb + AuthorName: M.A. 
Barrios + Tools & Applications: + Publications: diff --git a/datasets/landsat-8.yaml b/datasets/landsat-8.yaml index e890c290a..a193a9538 100644 --- a/datasets/landsat-8.yaml +++ b/datasets/landsat-8.yaml @@ -26,60 +26,64 @@ Resources: - Description: "[S3 Inventory](https://docs.aws.amazon.com/AmazonS3/latest/dev/storage-inventory.html#storage-inventory-contents) (ORC)" ARN: arn:aws:s3:::landsat-pds-inventory Region: us-west-2 - Type: S3 Bucket + Type: S3 Bucket DataAtWork: - - Title: Development Seed Geolambda - URL: https://developmentseed.org/blog/2017/08/17/geolambdas/ - AuthorName: Matthew Hanson - AuthorURL: https://developmentseed.org/team/matt-hanson/ - - Title: FME Landsat-8 on AWS Reader - URL: https://docs.safe.com/fme/html/FME_Desktop_Documentation/FME_ReadersWriters/landsat8aws/landsat8aws.htm - AuthorName: Safe Software - AuthorURL: https://www.safe.com/ - - Title: FME Landsat-8/Sentinel-2 File Selector - URL: http://demos.fmeserver.com/landsat-sentinel-selector/ - AuthorName: Safe Software - AuthorURL: https://www.safe.com/ - - Title: Sentinel Hub WMS/WMTS/WCS Service for Landsat - URL: http://www.sentinel-hub.com/apps/wms - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: Sentinel Playground for Landsat - URL: https://apps.sentinel-hub.com/sentinel-playground/?source=L8 - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: "A Gentle Introduction to GDAL Part 4: Working with Satellite Data" - URL: https://medium.com/planet-stories/a-gentle-introduction-to-gdal-part-4-working-with-satellite-data-d3835b5e2971 - AuthorName: Planet - AuthorURL: https://www.planet.com/ - - Title: Exploring the Chile wildfires with Landsat and Sentinel-2 imagery - URL: https://www.gearthblog.com/blog/archives/2017/02/exploring-chile-wildfires-landsat-sentinel-2-imagery.html - AuthorName: Timothy Whitehead - - Title: Using Vector tiles and AWS Lambda, we can build a really simple API to get Landsat and Sentinel images - URL: 
https://remotepixel.ca/blog/searchapi_20171211.html - AuthorName: Remote Pixel - AuthorURL: https://remotepixel.ca/ - - Title: COG-Explorer - View Cloud Optimized GeoTIFF images in the browser directly from object storage - URL: https://geotiffjs.github.io/cog-explorer/ - AuthorName: EOX - AuthorURL: https://eox.at/ - - Title: Spectator - tracking Landsat 8, accessing the data and quick preview - URL: https://spectator.earth/ - AuthorName: Spectator - AuthorURL: https://spectator.earth/ - - Title: Apps for exploring and analyzing Landsat imagery on the fly - URL: http://www.esri.com/landing-pages/software/landsat/unlock-earths-secrets - AuthorName: Esri - AuthorURL: https://www.esri.com/en-us/home - - Title: Integrate imagery from the full Landsat archive into your own apps, maps, and analysis with Landsat image services - URL: http://www.arcgis.com/home/group.html?id=a74dff13f1be4b2ba7264c3315c57077#overview - AuthorName: Esri - AuthorURL: https://www.esri.com/en-us/home - - Title: EOS Land Viewer - URL: https://eos.com/landviewer/ - AuthorName: Earth Observing System - AuthorURL: https://eos.com/ - - Title: "Aggi: the fire detecting Twitter bot" - URL: https://twitter.com/aggibot - AuthorName: Aggi - AuthorURL: https://twitter.com/aggibot + Tutorials: + - Title: "A Gentle Introduction to GDAL Part 4: Working with Satellite Data" + URL: https://medium.com/planet-stories/a-gentle-introduction-to-gdal-part-4-working-with-satellite-data-d3835b5e2971 + AuthorName: Planet + AuthorURL: https://www.planet.com/ + - Title: Exploring the Chile wildfires with Landsat and Sentinel-2 imagery + URL: https://www.gearthblog.com/blog/archives/2017/02/exploring-chile-wildfires-landsat-sentinel-2-imagery.html + AuthorName: Timothy Whitehead + - Title: Using Vector tiles and AWS Lambda, we can build a really simple API to get Landsat and Sentinel images + URL: https://remotepixel.ca/blog/searchapi_20171211.html + AuthorName: Remote Pixel + AuthorURL: https://remotepixel.ca/ + - 
Title: Integrate imagery from the full Landsat archive into your own apps, maps, and analysis with Landsat image services + URL: http://www.arcgis.com/home/group.html?id=a74dff13f1be4b2ba7264c3315c57077#overview + AuthorName: Esri + AuthorURL: https://www.esri.com/en-us/home + Tools & Applications: + - Title: EOS Land Viewer + URL: https://eos.com/landviewer/ + AuthorName: Earth Observing System + AuthorURL: https://eos.com/ + - Title: "Aggi: the fire detecting Twitter bot" + URL: https://twitter.com/aggibot + AuthorName: Aggi + AuthorURL: https://twitter.com/aggibot + - Title: COG-Explorer - View Cloud Optimized GeoTIFF images in the browser directly from object storage + URL: https://geotiffjs.github.io/cog-explorer/ + AuthorName: EOX + AuthorURL: https://eox.at/ + - Title: Spectator - tracking Landsat 8, accessing the data and quick preview + URL: https://spectator.earth/ + AuthorName: Spectator + AuthorURL: https://spectator.earth/ + - Title: Apps for exploring and analyzing Landsat imagery on the fly + URL: http://www.esri.com/landing-pages/software/landsat/unlock-earths-secrets + AuthorName: Esri + AuthorURL: https://www.esri.com/en-us/home + - Title: Development Seed Geolambda + URL: https://developmentseed.org/blog/2017/08/17/geolambdas/ + AuthorName: Matthew Hanson + AuthorURL: https://developmentseed.org/team/matt-hanson/ + - Title: FME Landsat-8 on AWS Reader + URL: https://docs.safe.com/fme/html/FME_Desktop_Documentation/FME_ReadersWriters/landsat8aws/landsat8aws.htm + AuthorName: Safe Software + AuthorURL: https://www.safe.com/ + - Title: FME Landsat-8/Sentinel-2 File Selector + URL: http://demos.fmeserver.com/landsat-sentinel-selector/ + AuthorName: Safe Software + AuthorURL: https://www.safe.com/ + - Title: Sentinel Hub WMS/WMTS/WCS Service for Landsat + URL: http://www.sentinel-hub.com/apps/wms + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: Sentinel Playground for Landsat + URL: 
https://apps.sentinel-hub.com/sentinel-playground/?source=L8 + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + Publications: + diff --git a/datasets/lofar-elais-n1.yaml b/datasets/lofar-elais-n1.yaml index f7589e9f7..414774a66 100644 --- a/datasets/lofar-elais-n1.yaml +++ b/datasets/lofar-elais-n1.yaml @@ -16,7 +16,10 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Calibration of LOFAR ELAIS-N1 data in the Amazon cloud - URL: https://www.lofarcloud.uk - AuthorName: J. Sabater - AuthorURL: https://github.com/nudomarinero + Tutorials: + Tools & Applications: + Publications: + - Title: Calibration of LOFAR ELAIS-N1 data in the Amazon cloud + URL: https://www.lofarcloud.uk + AuthorName: J. Sabater + AuthorURL: https://github.com/nudomarinero diff --git a/datasets/medicare-drug-spending.yaml b/datasets/medicare-drug-spending.yaml deleted file mode 100644 index b6dcc4ef5..000000000 --- a/datasets/medicare-drug-spending.yaml +++ /dev/null @@ -1,21 +0,0 @@ -Name: Medicare Drug Spending -Description: | - Finding ways to make Medicare drug spending data more consumable. -Documentation: https://data.world/data4democracy/drug-spending -Contact: https://data.world/data4democracy/drug-spending/discuss -UpdateFrequency: Frequently -Tags: - - pharmaceutical - - statistics - - us -License: CC-BY -Resources: - - Description: Project data files - ARN: arn:aws:s3:::dataworld-odaws-us-east-1/datasets/data4democracy/drug-spending/ - Region: Descrius-east-1 - Type: S3 Bucket -DataAtWork: - - Title: Datasets for and from the drug-spending channel in the Data for Democracy community. 
- URL: https://data.world/data4democracy/drug-spending - AuthorName: Data for Democracy, @data4democracy on data.world - AuthorURL: https://data.world/data4democracy \ No newline at end of file diff --git a/datasets/meteo-france-models.yaml b/datasets/meteo-france-models.yaml index 86226cf9c..9294c36c5 100644 --- a/datasets/meteo-france-models.yaml +++ b/datasets/meteo-france-models.yaml @@ -35,11 +35,14 @@ Resources: Region: eu-west-1 Type: S3 Bucket DataAtWork: - - Title: Windguru.cz - URL: https://windguru.cz - AuthorName: Windguru - AuthorURL: https://windguru.cz - - Title: Windy.com - URL: https://windy.com - AuthorName: Windy - AuthorURL: https://windy.com + Tutorials: + Tools & Applications: + - Title: Windguru.cz + URL: https://windguru.cz + AuthorName: Windguru + AuthorURL: https://windguru.cz + - Title: Windy.com + URL: https://windy.com + AuthorName: Windy + AuthorURL: https://windy.com + Publications: diff --git a/datasets/mimiciii.yaml b/datasets/mimiciii.yaml new file mode 100644 index 000000000..b362b3bf8 --- /dev/null +++ b/datasets/mimiciii.yaml @@ -0,0 +1,43 @@ +Name: MIMIC-III (‘Medical Information Mart for Intensive Care’) +Description: | + MIMIC-III (‘Medical Information Mart for Intensive Care’) is a large, + single-center database comprising information relating to patients + admitted to critical care units at a large tertiary care hospital. + Data includes vital signs, medications, laboratory measurements, + observations and notes charted by care providers, fluid balance, + procedure codes, diagnostic codes, imaging reports, hospital length + of stay, survival data, and more. The database supports applications + including academic and industrial research, quality improvement initiatives, + and higher education coursework. The MIMIC-III dataset is freely-available. + Researchers seeking to use the database must formally request access. For details, see + [the getting started page](https://mimic.physionet.org/gettingstarted/access/). 
Once you + have a PhysioNet account, you must enable access to the MIMIC-III dataset from your + AWS account. To do this, please [input your AWS account number](https://physionet.org/settings/cloud/), and + [request access to the MIMIC-III Clinical Database on AWS](https://physionet.org/projects/mimiciii/1.4/request_access/2). +Documentation: https://mimic.physionet.org/ +Contact: https://mimic.physionet.org/help/ +UpdateFrequency: Not updated +Tags: + - bioinformatics + - health + - life sciences + - natural language processing + - us +License: https://physionet.org/content/mimiciii/view-license/1.4/ +Resources: + - Description: Project data files + ARN: arn:aws:s3:::mimic-iii-physionet + Region: us-east-1 + Type: S3 Bucket +DataAtWork: + Tutorials: + - Title: Perform biomedical informatics without a database using MIMIC-III data and Amazon Athena + URL: https://aws.amazon.com/blogs/big-data/perform-biomedical-informatics-without-a-database-using-mimic-iii-data-and-amazon-athena/ + AuthorName: James Wiggins, Alistair Johnson + Tools & Applications: + - Title: MIMIC-code GitHub repository + URL: https://github.com/MIT-LCP/mimic-code + AuthorName: Alistair Johnson + AuthorURL: https://github.com/alistairewj + Publications: + diff --git a/datasets/mmid.yaml b/datasets/mmid.yaml index a7ee35973..cccc406ef 100644 --- a/datasets/mmid.yaml +++ b/datasets/mmid.yaml @@ -18,4 +18,8 @@ Resources: Images for words in various languages, packaged by in .tar archives by each language. 
ARN: arn:aws:s3:::mmid-pds Region: us-east-1 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/modis.yaml b/datasets/modis.yaml index 932288c7c..ed95fb17d 100644 --- a/datasets/modis.yaml +++ b/datasets/modis.yaml @@ -21,15 +21,18 @@ Resources: Region: us-west-2 Type: SNS Topic DataAtWork: - - Title: Sentinel Hub WMS/WMTS/WCS Service for MODIS - URL: http://www.sentinel-hub.com/apps/wms - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: Sentinel Playground for MODIS - URL: https://apps.sentinel-hub.com/sentinel-playground/?source=Modis&lat=37.274052809979054&lng=-78.8818359375&zoom=7 - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: EOS Land Viewer - URL: https://eos.com/landviewer/ - AuthorName: Earth Observing System - AuthorURL: https://eos.com/ + Tutorials: + Tools & Applications: + - Title: Sentinel Hub WMS/WMTS/WCS Service for MODIS + URL: http://www.sentinel-hub.com/apps/wms + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: Sentinel Playground for MODIS + URL: https://apps.sentinel-hub.com/sentinel-playground/?source=Modis&lat=37.274052809979054&lng=-78.8818359375&zoom=7 + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: EOS Land Viewer + URL: https://eos.com/landviewer/ + AuthorName: Earth Observing System + AuthorURL: https://eos.com/ + Publications: \ No newline at end of file diff --git a/datasets/mogreps.yaml b/datasets/mogreps.yaml index 030e113f6..14466dbb9 100644 --- a/datasets/mogreps.yaml +++ b/datasets/mogreps.yaml @@ -20,4 +20,8 @@ Resources: - Description: High resolution weather forecast covering the United Kingdom ARN: arn:aws:s3:::mogreps-uk Region: eu-west-2 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff 
--git a/datasets/multimedia-commons.yaml b/datasets/multimedia-commons.yaml index a5dcad6cc..4371758e1 100644 --- a/datasets/multimedia-commons.yaml +++ b/datasets/multimedia-commons.yaml @@ -14,3 +14,7 @@ Resources: ARN: arn:aws:s3:::multimedia-commons Region: us-west-2 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/naip.yaml b/datasets/naip.yaml index 8d33a1081..7a49bc329 100644 --- a/datasets/naip.yaml +++ b/datasets/naip.yaml @@ -31,11 +31,14 @@ Resources: Type: S3 Bucket RequesterPays: True DataAtWork: - - Title: VoyagerSearch showing off Batch + NAIP - URL: https://www.voyagersearch.com/using-aws-batch-to-generate-image-thumbnails-for-voyager - AuthorName: Voyager - AuthorURL: https://www.voyagersearch.com/ - - Title: EOS Land Viewer - URL: https://eos.com/landviewer/ - AuthorName: Earth Observing System - AuthorURL: https://eos.com/ + Tutorials: + Tools & Applications: + - Title: VoyagerSearch showing off Batch + NAIP + URL: https://www.voyagersearch.com/using-aws-batch-to-generate-image-thumbnails-for-voyager + AuthorName: Voyager + AuthorURL: https://www.voyagersearch.com/ + - Title: EOS Land Viewer + URL: https://eos.com/landviewer/ + AuthorName: Earth Observing System + AuthorURL: https://eos.com/ + Publications: \ No newline at end of file diff --git a/datasets/nanopore.yaml b/datasets/nanopore.yaml index 9b476ff5f..83532dd6a 100644 --- a/datasets/nanopore.yaml +++ b/datasets/nanopore.yaml @@ -12,4 +12,8 @@ Resources: - Description: Nanopore Reference Human Genome ARN: arn:aws:s3:::nanopore-human-wgs Region: us-east-1 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/nasanex.yaml b/datasets/nasanex.yaml index ca3a44a37..17cd19888 100644 --- a/datasets/nasanex.yaml +++ b/datasets/nasanex.yaml @@ -33,11 +33,14 @@ Resources: Region: us-west-2 
Type: S3 Bucket DataAtWork: - - Title: Azavea Climate API - URL: https://climate.azavea.com - AuthorName: Azavea - AuthorURL: https://www.azavea.com/ - - Title: Accessing and plotting NASA-NEX data, from GEOSChem-on-cloud tutorial. - URL: http://cloud-gc.readthedocs.io/en/stable/chapter02_beginner-tutorial/use-s3.html#access-nasa-nex-data-in-s3-optional-but-recommended - AuthorName: Jiawei Zhuang - AuthorURL: https://github.com/JiaweiZhuang + Tutorials: + - Title: Accessing and plotting NASA-NEX data, from GEOSChem-on-cloud tutorial. + URL: http://cloud-gc.readthedocs.io/en/stable/chapter02_beginner-tutorial/use-s3.html#access-nasa-nex-data-in-s3-optional-but-recommended + AuthorName: Jiawei Zhuang + AuthorURL: https://github.com/JiaweiZhuang + Tools & Applications: + - Title: Azavea Climate API + URL: https://climate.azavea.com + AuthorName: Azavea + AuthorURL: https://www.azavea.com/ + Publications: diff --git a/datasets/nfa.yaml b/datasets/nfa.yaml deleted file mode 100644 index 8cddf1cc8..000000000 --- a/datasets/nfa.yaml +++ /dev/null @@ -1,24 +0,0 @@ -Name: NFA 2017 - Ecological Resource Use and Resource Capacity of Nations from 1961 to 2013 -Description: | - Our National Footprint Accounts (NFAs) measure the ecological resource use and resource capacity of nations from 1961 to 2013. - The calculations in the National Footprint Accounts are primarily based on United Nations data sets, including those published by the Food and Agriculture Organization, United Nations Commodity Trade Statistics Database, and the UN Statistics Division, as well as the International Energy Agency. 
-Contact: https://data.world/footprint/nfa-2017-edition/discuss -UpdateFrequency: Annually -Documentation: https://data.world/footprint/nfa-2017-edition -Tags: - - environmental - - climate - - economics - - life sciences - - sustainability -License: CC-BY-SA -Resources: - - Description: Project data files - ARN: arn:aws:s3:::dataworld-odaws-us-east-1/datasets/footprint/nfa-2017-edition/ - Region: us-east-1 - Type: S3 Bucket -DataAtWork: - - Title: Primarily based on United Nations data sets - URL: https://data.world/footprint/nfa-2017-edition - AuthorName: Global Footprint Network, @footprint on data.world - AuthorURL: https://data.world/footprint \ No newline at end of file diff --git a/datasets/noaa-gefs.yaml b/datasets/noaa-gefs.yaml index bf0edd03d..cdd66c1b3 100644 --- a/datasets/noaa-gefs.yaml +++ b/datasets/noaa-gefs.yaml @@ -1,5 +1,5 @@ Name: NOAA Global Ensemble Forecast System (GEFS) -Description: The Global Ensemble Forecast System (GEFS), previously known as the GFS Global ENSemble (GENS), is a weather forecast model made up of 21 separate forecasts, or ensemble members. The National Centers for Environmental Prediction (NCEP) started the GEFS to address the nature of uncertainty in weather observations, which is used to initialize weather forecast models. The GEFS attempts to quantify the amount of uncertainty in a forecast by generating an ensemble of multiple forecasts, each minutely different, or perturbed, from the original observations. With global coverage, GEFS is produced four times a day with weather forecasts going out to 16 days. +Description: The Global Ensemble Forecast System (GEFS), previously known as the GFS Global ENSemble (GENS), is a weather forecast model made up of 21 separate forecasts, or ensemble members. The National Centers for Environmental Prediction (NCEP) started the GEFS to address the nature of uncertainty in weather observations, which is used to initialize weather forecast models. 
The GEFS attempts to quantify the amount of uncertainty in a forecast by generating an ensemble of multiple forecasts, each minutely different, or perturbed, from the original observations. With global coverage, GEFS is produced four times a day with weather forecasts going out to 16 days. Documentation: https://docs.opendata.aws/noaa-gefs-pds/readme.html Contact: For questions regarding data content or quality, visit [the NOAA GEFS site](http://www.emc.ncep.noaa.gov/index.php?branch=GEFS). For any questions regarding data delivery not associated with this platform or any general questions regarding the NOAA Big Data Project, email noaa.bdp@noaa.gov ManagedBy: "[NOAA](http://www.noaa.gov/)" @@ -16,3 +16,7 @@ Resources: ARN: arn:aws:s3:::noaa-gefs-pds Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/noaa-gfs-bdp-pds.yaml b/datasets/noaa-gfs-bdp-pds.yaml index 4b94b9a25..086199f6a 100644 --- a/datasets/noaa-gfs-bdp-pds.yaml +++ b/datasets/noaa-gfs-bdp-pds.yaml @@ -42,3 +42,7 @@ Resources: ARN: arn:aws:sns:us-east-1:123901341784:NewGFSParaObject Region: us-east-1 Type: SNS Topic +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/noaa-gfs-pds.yaml b/datasets/noaa-gfs-pds.yaml index 0fc3aaf9f..58eaa756d 100644 --- a/datasets/noaa-gfs-pds.yaml +++ b/datasets/noaa-gfs-pds.yaml @@ -22,7 +22,10 @@ Resources: Region: us-east-1 Type: SNS Topic DataAtWork: - - Title: "PODPAC: Python Library supporting GFS for analysis" - URL: https://podpac.org/datasets.html#gfs - AuthorName: Creare - AuthorURL: http://www.creare.com/ + Tutorials: + Tools & Applications: + - Title: "PODPAC: Python Library supporting GFS for analysis" + URL: https://podpac.org/datasets.html#gfs + AuthorName: Creare + AuthorURL: http://www.creare.com/ + Publications: diff --git a/datasets/noaa-ghcn.yaml b/datasets/noaa-ghcn.yaml index 
0f6c42fb8..5b36ed190 100644 --- a/datasets/noaa-ghcn.yaml +++ b/datasets/noaa-ghcn.yaml @@ -17,6 +17,9 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Visualize over 200 years of global climate data using Amazon Athena and Amazon QuickSight - URL: https://aws.amazon.com/blogs/big-data/visualize-over-200-years-of-global-climate-data-using-amazon-athena-and-amazon-quicksight/ - AuthorName: Conor Delaney + Tutorials: + - Title: Visualize over 200 years of global climate data using Amazon Athena and Amazon QuickSight + URL: https://aws.amazon.com/blogs/big-data/visualize-over-200-years-of-global-climate-data-using-amazon-athena-and-amazon-quicksight/ + AuthorName: Conor Delaney + Tools & Applications: + Publications: diff --git a/datasets/noaa-ghcnh.yaml b/datasets/noaa-ghcnh.yaml index 68ea9d659..45ee163a6 100644 --- a/datasets/noaa-ghcnh.yaml +++ b/datasets/noaa-ghcnh.yaml @@ -28,3 +28,7 @@ Resources: ARN: arn:aws:s3:::noaa-global-hourly-pds Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/noaa-ghe.yaml b/datasets/noaa-ghe.yaml index fdd390ac7..73f11a3d2 100644 --- a/datasets/noaa-ghe.yaml +++ b/datasets/noaa-ghe.yaml @@ -30,3 +30,11 @@ Resources: ARN: arn:aws:s3:::noaa-ghe-pds Region: us-east-1 Type: S3 Bucket + - Description: New data notifications for GHE, only Lambda and SQS protocols allowed + ARN: arn:aws:sns:us-east-1:123901341784:NewGHEObject + Region: us-east-1 + Type: SNS Topic +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/noaa-goes.yaml b/datasets/noaa-goes.yaml index dc1e495ad..89191f1de 100644 --- a/datasets/noaa-goes.yaml +++ b/datasets/noaa-goes.yaml @@ -41,10 +41,13 @@ Resources: Region: us-east-1 Type: SNS Topic DataAtWork: - - Title: Billions of Birds Migrate. Where Do They Go? 
- URL: https://www.nationalgeographic.com/magazine/2018/03/bird-migration-interactive-maps/ - AuthorName: National Geographic - - Title: Visualize GOES-16 in Python using Xarray - URL: https://github.com/HamedAlemo/visualize-goes16 - AuthorName: Hamed Alemohammad - AuthorURL: https://www.linkedin.com/in/hamedalemohammad/ + Tutorials: + - Title: Visualize GOES-16 in Python using Xarray + URL: https://github.com/HamedAlemo/visualize-goes16 + AuthorName: Hamed Alemohammad + AuthorURL: https://www.linkedin.com/in/hamedalemohammad/ + Tools & Applications: + Publications: + - Title: Billions of Birds Migrate. Where Do They Go? + URL: https://www.nationalgeographic.com/magazine/2018/03/bird-migration-interactive-maps/ + AuthorName: National Geographic diff --git a/datasets/noaa-gsod.yaml b/datasets/noaa-gsod.yaml index 24df38aa5..8e4dcb257 100644 --- a/datasets/noaa-gsod.yaml +++ b/datasets/noaa-gsod.yaml @@ -17,4 +17,8 @@ Resources: - Description: Measurements and metadata ARN: arn:aws:s3:::aws-gsod Region: us-east-1 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/noaa-hrrr-pds.yaml b/datasets/noaa-hrrr-pds.yaml index 0bf8cf55b..6ed220077 100644 --- a/datasets/noaa-hrrr-pds.yaml +++ b/datasets/noaa-hrrr-pds.yaml @@ -21,3 +21,7 @@ Resources: ARN: arn:aws:sns:us-east-1:104891172899:noaa-hrrr-pds Region: us-east-1 Type: SNS Topic +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/noaa-isd.yaml b/datasets/noaa-isd.yaml index 8f0e7969c..8cb4b176e 100644 --- a/datasets/noaa-isd.yaml +++ b/datasets/noaa-isd.yaml @@ -38,3 +38,7 @@ Resources: ARN: arn:aws:s3:::noaa-isd-pds Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/noaa-nexrad.yaml b/datasets/noaa-nexrad.yaml index 
6366c7436..3df258361 100644 --- a/datasets/noaa-nexrad.yaml +++ b/datasets/noaa-nexrad.yaml @@ -30,23 +30,32 @@ Resources: Region: us-east-1 Type: SNS Topic DataAtWork: - - Title: Using Python to Access NCEI Archived NEXRAD Level 2 Data (Jupyter notebook) - URL: http://nbviewer.jupyter.org/gist/dopplershift/356f2e14832e9b676207 - AuthorName: Ryan May - AuthorURL: http://dopplershift.github.io - - Title: Mapping Noaa Nexrad Radar Data With CARTO - URL: https://carto.com/blog/mapping-nexrad-radar-data/ - AuthorName: Stuart Lynn - AuthorURL: https://carto.com/blog/author/stuart-lynn/ - - Title: NEXRAD on EC2 tutorial - URL: https://github.com/openradar/AMS_radar_in_the_cloud - AuthorName: openradar - AuthorURL: https://github.com/openradar - - Title: nexradaws on pypi.python.org - python module to query and download Nexrad data from Amazon S3 - URL: https://pypi.org/project/nexradaws/ - AuthorName: Aaron Anderson - AuthorURL: https://github.com/aarande - - Title: WeatherPipe - Amazon EMR based analysis tool for NEXRAD data stored on Amazon S3 - URL: https://github.com/stephenlienharrell/WeatherPipe - AuthorName: Stephen Lien Harrell - AuthorURL: https://github.com/stephenlienharrell + Tutorials: + - Title: Using Python to Access NCEI Archived NEXRAD Level 2 Data (Jupyter notebook) + URL: http://nbviewer.jupyter.org/gist/dopplershift/356f2e14832e9b676207 + AuthorName: Ryan May + AuthorURL: http://dopplershift.github.io + - Title: Mapping Noaa Nexrad Radar Data With CARTO + URL: https://carto.com/blog/mapping-nexrad-radar-data/ + AuthorName: Stuart Lynn + AuthorURL: https://carto.com/blog/author/stuart-lynn/ + - Title: NEXRAD on EC2 tutorial + URL: https://github.com/openradar/AMS_radar_in_the_cloud + AuthorName: openradar + AuthorURL: https://github.com/openradar + Tools & Applications: + - Title: nexradaws on pypi.python.org - python module to query and download Nexrad data from Amazon S3 + URL: https://pypi.org/project/nexradaws/ + AuthorName: Aaron Anderson + 
AuthorURL: https://github.com/aarande + - Title: WeatherPipe - Amazon EMR based analysis tool for NEXRAD data stored on Amazon S3 + URL: https://github.com/stephenlienharrell/WeatherPipe + AuthorName: Stephen Lien Harrell + AuthorURL: https://github.com/stephenlienharrell + Publications: + - Title: Seasonal abundance and survival of North America’s migratory avifauna determined by weather radar + URL: https://www.nature.com/articles/s41559-018-0666-4 + AuthorName: Adriaan M. Dokter, Andrew Farnsworth, Daniel Fink, Viviana Ruiz-Gutierrez, Wesley M. Hochachka, Frank A. La Sorte, Orin J. Robinson, Kenneth V. Rosenberg & Steve Kelling + - Title: Unlocking the Potential of NEXRAD Data through NOAA’s Big Data Partnership + URL: https://journals.ametsoc.org/doi/full/10.1175/BAMS-D-16-0021.1 + AuthorName: Steve Ansari and Stephen Del Greco \ No newline at end of file diff --git a/datasets/noaa-nwm-pds.yaml b/datasets/noaa-nwm-pds.yaml index 2702ea339..4243d5b26 100644 --- a/datasets/noaa-nwm-pds.yaml +++ b/datasets/noaa-nwm-pds.yaml @@ -33,4 +33,7 @@ Resources: ARN: arn:aws:s3:::noaa-nwm-pds Region: us-east-1 Type: S3 Bucket - +DataAtWork: + Tutorials: + Tools & Applications: + Publications: diff --git a/datasets/noaa-ofs.yaml b/datasets/noaa-ofs.yaml index 42db2e677..968938ca5 100644 --- a/datasets/noaa-ofs.yaml +++ b/datasets/noaa-ofs.yaml @@ -21,3 +21,7 @@ Resources: ARN: arn:aws:s3:::noaa-ofs-pds Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/nrel-pds-nsrdb.yaml b/datasets/nrel-pds-nsrdb.yaml index 6b14e0bad..dfe15e674 100644 --- a/datasets/nrel-pds-nsrdb.yaml +++ b/datasets/nrel-pds-nsrdb.yaml @@ -12,7 +12,7 @@ ManagedBy: '[National Renewable Energy Laboratory](https://www.nrel.gov/)' UpdateFrequency: As Needed Tags: - aws-pds - - earth observation + - earth observation - energy - geospatial - meteorological @@ -29,9 +29,12 @@ Resources: Region: us-west-2 Type: S3 
Bucket DataAtWork: - - Title: The National Solar Radiation Data Base (NSRDB) - URL: https://www.sciencedirect.com/science/article/pii/S136403211830087X - AuthorName: Manajit Sengupta, Yu Xe, Anthony Lopez, Aron Habte, Galen Maclaurin, James Shelby - - Title: NSRDB Viewer - URL: https://nsrdb.nrel.gov/nsrdb-viewer - AuthorName: Manajit Sengupta, Yu Xe, Anthony Lopez, Aron Habte, Galen Maclaurin, James Shelby, Paul Edwards + Tutorials: + Tools & Applications: + - Title: NSRDB Viewer + URL: https://nsrdb.nrel.gov/nsrdb-viewer + AuthorName: Manajit Sengupta, Yu Xe, Anthony Lopez, Aron Habte, Galen Maclaurin, James Shelby, Paul Edwards + Publications: + - Title: The National Solar Radiation Data Base (NSRDB) + URL: https://www.sciencedirect.com/science/article/pii/S136403211830087X + AuthorName: Manajit Sengupta, Yu Xe, Anthony Lopez, Aron Habte, Galen Maclaurin, James Shelby diff --git a/datasets/nrel-pds-wtk.yaml b/datasets/nrel-pds-wtk.yaml index 7e64f3d23..25a5723e3 100644 --- a/datasets/nrel-pds-wtk.yaml +++ b/datasets/nrel-pds-wtk.yaml @@ -41,15 +41,18 @@ Resources: Region: us-west-2 Type: S3 Bucket DataAtWork: - - Title: 'Power from wind: Open data on AWS' - URL: https://aws.amazon.com/blogs/big-data/power-from-wind-open-data-on-aws/ - AuthorName: Caleb Phillips, Caroline Draxl, John Readey, Jordan Perr-Sauer - AuthorURL: https://www.nrel.gov/research/caleb-phillips.html - - Title: HSDS Examples - URL: https://github.com/NREL/hsds-examples - AuthorName: Caleb Phillips, Caroline Draxl, John Readey, Jordan Perr-Sauer - AuthorURL: https://www.nrel.gov/research/caleb-phillips.html - - Title: Wind Visualization - URL: https://github.com/NREL/hsds-viz - AuthorName: Jordan Perr-Sauer - AuthorURL: https://www.nrel.gov/research/jordan-perr-sauer.html + Tutorials: + Tools & Applications: + - Title: HSDS Examples + URL: https://github.com/NREL/hsds-examples + AuthorName: Caleb Phillips, Caroline Draxl, John Readey, Jordan Perr-Sauer + AuthorURL: 
https://www.nrel.gov/research/caleb-phillips.html + - Title: Wind Visualization + URL: https://github.com/NREL/hsds-viz + AuthorName: Jordan Perr-Sauer + AuthorURL: https://www.nrel.gov/research/jordan-perr-sauer.html + Publications: + - Title: 'Power from wind: Open data on AWS' + URL: https://aws.amazon.com/blogs/big-data/power-from-wind-open-data-on-aws/ + AuthorName: Caleb Phillips, Caroline Draxl, John Readey, Jordan Perr-Sauer + AuthorURL: https://www.nrel.gov/research/caleb-phillips.html diff --git a/datasets/nwm-archive.yaml b/datasets/nwm-archive.yaml index 6660c8702..91ce8fabb 100644 --- a/datasets/nwm-archive.yaml +++ b/datasets/nwm-archive.yaml @@ -1,25 +1,24 @@ Name: NOAA National Water Model Reanalysis Description: | The NOAA National Water Model Reanalysis dataset contains output - from a 25-year retrospective simulation (January 1993 through - December 2017) of version 1.2 of the National Water Model. This - simulation used observed rainfall as input and ingested other - required meteorological input fields from a weather Reanalysis + from multi-decade retrospective simulations. These + simulations used observed rainfall as input and ingested other + required meteorological input fields from a weather reanalysis dataset. The output frequency and fields available in this historical NWM dataset differ from those contained in the real-time forecast model. One application of this dataset is to provide historical context to current real-time streamflow, - soil moisture and snowpack NWM conditions. The Reanalysis data + soil moisture and snowpack NWM conditions. The reanalysis data can be used to infer flow frequencies and perform temporal analyses with hourly streamflow output and 3-hourly land surface output. The long-term dataset can also be used in the development of end user applications which require a long baseline of data for system training or verification purposes. This dataset contains output from two - retrospective simulations. 
A 25-year retrospective simulation using version - 1.2 of the National Water Model (January 1993 through December 2017), and a - 26-year retrospective simulation using version 2.0 of the National Water Model - (January 1993 through December 2018). Version 2.0 of the National Water Model - was implemented into operations with the 12UTC run on June 19, 2019. + retrospective simulations. Currently there are two versions of the dataset: + A 25-year (January 1993 through December 2017) retrospective simulation using + version 1.2 of the National Water Model, and a 26-year (January 1993 through + December 2018) retrospective simulation using version 2.0 + of the National Water Model. Documentation: https://docs.opendata.aws/nwm-archive/readme.html Contact: | For questions regarding data content or quality, go [here](http://water.noaa.gov/about/nwm). @@ -42,7 +41,11 @@ Resources: ARN: arn:aws:s3:::noaa-nwm-retro-v2.0-pds Region: us-east-1 Type: S3 Bucket - - Description: The complete archive of NWM data. + - Description: The complete archive of NWM data version 1.2. 
ARN: arn:aws:s3:::nwm-archive Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/nyc-tlc-trip-records-pds.yaml b/datasets/nyc-tlc-trip-records-pds.yaml index daddbe15f..7055fb8bd 100644 --- a/datasets/nyc-tlc-trip-records-pds.yaml +++ b/datasets/nyc-tlc-trip-records-pds.yaml @@ -15,15 +15,18 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Deep Dive on Flink & Spark on Amazon EMR - URL: https://www.youtube.com/watch?v=MzTZp47Jy7E - AuthorName: Keith Steward - - Title: Build a Real-time Stream Processing Pipeline with Apache Flink on AWS - URL: https://aws.amazon.com/blogs/big-data/build-a-real-time-stream-processing-pipeline-with-apache-flink-on-aws/ - AuthorName: Steffen Hausmann - - Title: Exploring data with Python and Amazon S3 Select - URL: https://github.com/aws-samples/aws-open-data-analytics-notebooks/tree/master/exploring-data - AuthorName: Manav Sehgal - - Title: Optimizing data for analysis with Amazon Athena and AWS Glue - URL: https://github.com/aws-samples/aws-open-data-analytics-notebooks/tree/master/optimizing-data - AuthorName: Manav Sehgal + Tutorials: + - Title: Deep Dive on Flink & Spark on Amazon EMR + URL: https://www.youtube.com/watch?v=MzTZp47Jy7E + AuthorName: Keith Steward + - Title: Build a Real-time Stream Processing Pipeline with Apache Flink on AWS + URL: https://aws.amazon.com/blogs/big-data/build-a-real-time-stream-processing-pipeline-with-apache-flink-on-aws/ + AuthorName: Steffen Hausmann + - Title: Exploring data with Python and Amazon S3 Select + URL: https://github.com/aws-samples/aws-open-data-analytics-notebooks/tree/master/exploring-data + AuthorName: Manav Sehgal + - Title: Optimizing data for analysis with Amazon Athena and AWS Glue + URL: https://github.com/aws-samples/aws-open-data-analytics-notebooks/tree/master/optimizing-data + AuthorName: Manav Sehgal + Tools & Applications: + Publications: diff 
--git a/datasets/ooni.yaml b/datasets/ooni.yaml index 94e63093a..ac36640f4 100644 --- a/datasets/ooni.yaml +++ b/datasets/ooni.yaml @@ -12,3 +12,7 @@ Resources: ARN: arn:aws:s3:::ooni-data Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/openaq.yaml b/datasets/openaq.yaml index 5b3acdc67..0d31a39e4 100644 --- a/datasets/openaq.yaml +++ b/datasets/openaq.yaml @@ -29,22 +29,29 @@ Resources: Region: us-east-1 Type: CloudFront Distribution DataAtWork: - - Title: "Smokey: Air Quality Bot" - URL: https://www.facebook.com/smokeybot/ - AuthorName: Amrit Sharma - AuthorURL: https://twitter.com/amrit_sharma - - Title: ropenaq R package - URL: https://github.com/ropensci/ropenaq - AuthorName: Maëlle Salmon - AuthorURL: https://github.com/maelle - - Title: hackAIR - URL: http://www.hackair.eu/ - AuthorName: hackAir - - Title: ARISense - URL: https://arisense.io/ - AuthorName: Aerodyne Research, Inc. 
- AuthorURL: http://www.aerodyne.com/ - - Title: Access OpenAQ data via a filterable SNS topic - URL: https://medium.com/@openaq/get-faster-access-to-real-time-air-quality-data-from-around-the-world-c6f9793d5242 - AuthorName: OpenAQ - AuthorURL: https://openaq.org + Tutorials: + - Title: Access OpenAQ data via a filterable SNS topic + URL: https://medium.com/@openaq/get-faster-access-to-real-time-air-quality-data-from-around-the-world-c6f9793d5242 + AuthorName: OpenAQ + AuthorURL: https://openaq.org + - Title: Using Athena to access the whole archive + URL: https://medium.com/@openaq/how-in-the-world-do-you-access-air-quality-data-older-than-90-days-on-the-openaq-platform-8562df519ecd + AuthorName: OpenAQ + AuthorURL: https://openaq.org + Tools & Applications: + - Title: "Smokey: Air Quality Bot" + URL: https://www.facebook.com/smokeybot/ + AuthorName: Amrit Sharma + AuthorURL: https://twitter.com/amrit_sharma + - Title: ropenaq R package + URL: https://github.com/ropensci/ropenaq + AuthorName: Maëlle Salmon + AuthorURL: https://github.com/maelle + - Title: hackAIR + URL: http://www.hackair.eu/ + AuthorName: hackAir + - Title: ARISense + URL: https://arisense.io/ + AuthorName: Aerodyne Research, Inc. 
+ AuthorURL: http://www.aerodyne.com/ + Publications: diff --git a/datasets/opencitymodel.yaml b/datasets/opencitymodel.yaml index 7b795430b..13ebd4a79 100644 --- a/datasets/opencitymodel.yaml +++ b/datasets/opencitymodel.yaml @@ -17,11 +17,14 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Using Open City Model with the 3dCityDB - URL: https://github.com/opencitymodel/opencitymodel/blob/master/examples/3dCityDB-to-GoogleEarth.md - AuthorName: Allen Gilliland - AuthorURL: https://github.com/agilliland - - Title: Running queries on Open City Model using AWS Athena - URL: https://github.com/opencitymodel/opencitymodel/blob/master/examples/Query-OpenCityModel-using-AWS-Athena.md - AuthorName: Allen Gilliland - AuthorURL: https://github.com/agilliland + Tutorials: + - Title: Using Open City Model with the 3dCityDB + URL: https://github.com/opencitymodel/opencitymodel/blob/master/examples/3dCityDB-to-GoogleEarth.md + AuthorName: Allen Gilliland + AuthorURL: https://github.com/agilliland + - Title: Running queries on Open City Model using AWS Athena + URL: https://github.com/opencitymodel/opencitymodel/blob/master/examples/Query-OpenCityModel-using-AWS-Athena.md + AuthorName: Allen Gilliland + AuthorURL: https://github.com/agilliland + Tools & Applications: + Publications: diff --git a/datasets/openneuro.yaml b/datasets/openneuro.yaml index f5117ceb1..5598f0d7d 100644 --- a/datasets/openneuro.yaml +++ b/datasets/openneuro.yaml @@ -15,3 +15,7 @@ Resources: ARN: arn:aws:s3:::openneuro.org Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/osm.yaml b/datasets/osm.yaml index c424cf3a0..5407b9ee9 100644 --- a/datasets/osm.yaml +++ b/datasets/osm.yaml @@ -21,18 +21,21 @@ Resources: Region: us-east-1 Type: SNS Topic DataAtWork: - - Title: OSM+Athena (GitHub) - URL: https://github.com/developmentseed/mrworldwide/ - AuthorName: Development Seed - AuthorURL: 
https://developmentseed.org/ - - Title: Querying OpenStreetMap with Amazon Athena - URL: https://aws.amazon.com/blogs/big-data/querying-openstreetmap-with-amazon-athena/ - AuthorName: Seth Fitzsimmons - AuthorURL: https://github.com/mojodna - - Title: Develop and Extract Value from Open Data - URL: https://aws.amazon.com/blogs/publicsector/develop-and-extract-value-from-open-data/ - AuthorName: Daniel Bernao - - Title: "PlanetUtils (GitHub): Scripts and a Docker container to maintain your own OpenStreetMap planet" - URL: https://github.com/interline-io/planetutils - AuthorName: Interline Technologies - AuthorURL: https://www.interline.io/ + Tutorials: + - Title: Querying OpenStreetMap with Amazon Athena + URL: https://aws.amazon.com/blogs/big-data/querying-openstreetmap-with-amazon-athena/ + AuthorName: Seth Fitzsimmons + AuthorURL: https://github.com/mojodna + - Title: Develop and Extract Value from Open Data + URL: https://aws.amazon.com/blogs/publicsector/develop-and-extract-value-from-open-data/ + AuthorName: Daniel Bernao + Tools & Applications: + - Title: "PlanetUtils (GitHub): Scripts and a Docker container to maintain your own OpenStreetMap planet" + URL: https://github.com/interline-io/planetutils + AuthorName: Interline Technologies + AuthorURL: https://www.interline.io/ + - Title: OSM+Athena (GitHub) + URL: https://github.com/developmentseed/mrworldwide/ + AuthorName: Development Seed + AuthorURL: https://developmentseed.org/ + Publications: diff --git a/datasets/osmlr.yaml b/datasets/osmlr.yaml index de5ae89c8..7535e2485 100644 --- a/datasets/osmlr.yaml +++ b/datasets/osmlr.yaml @@ -16,3 +16,7 @@ Resources: ARN: arn:aws:s3:::osmlr Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/paracrawl.yaml b/datasets/paracrawl.yaml index 9f0792247..20344b3d7 100644 --- a/datasets/paracrawl.yaml +++ b/datasets/paracrawl.yaml @@ -11,7 +11,11 @@ Tags: - natural language 
processing License: Creative Commons CC0 license ("no rights reserved"). Resources: - - Description: Parallel Corpora to/from English for all official EU languages + - Description: Parallel Corpora to/from English for all official EU languages ARN: arn:aws:s3:::web-language-models Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/physionet.yaml b/datasets/physionet.yaml index 86037fdb9..6afbeee94 100644 --- a/datasets/physionet.yaml +++ b/datasets/physionet.yaml @@ -12,4 +12,8 @@ Resources: - Description: https://s3.amazonaws.com/physionet-pds/index.html ARN: arn:aws:s3:::physionet-pds Region: us-east-1 - Type: S3 Bucket \ No newline at end of file + Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/qiime2.yaml b/datasets/qiime2.yaml index 7202d3486..9deb257fc 100644 --- a/datasets/qiime2.yaml +++ b/datasets/qiime2.yaml @@ -24,11 +24,10 @@ Resources: Region: us-west-2 Type: S3 Bucket DataAtWork: - - Title: QIIME 2 User Documentation - URL: https://docs.qiime2.org - AuthorName: The QIIME 2 Development Team - AuthorURL: https://github.com/qiime2/docs/graphs/contributors - - Title: Installing QIIME 2 using Amazon Web Services - URL: https://docs.qiime2.org/2018.11/install/virtual/aws/ - AuthorName: The QIIME 2 Development Team - AuthorURL: https://github.com/qiime2/docs/graphs/contributors + Tutorials: + - Title: Installing QIIME 2 using Amazon Web Services + URL: https://docs.qiime2.org/2018.11/install/virtual/aws/ + AuthorName: The QIIME 2 Development Team + AuthorURL: https://github.com/qiime2/docs/graphs/contributors + Tools & Applications: + Publications: diff --git a/datasets/rapid7-fdns-any.yaml b/datasets/rapid7-fdns-any.yaml index 47cfc7ac1..11f788142 100644 --- a/datasets/rapid7-fdns-any.yaml +++ b/datasets/rapid7-fdns-any.yaml @@ -19,8 +19,8 @@ Resources: - Description: | FDNS 
ANY Gzip-compressed parquet files following a HIVE partitioning model, with a 90-day retention period. This dataset represents the data returned for a name - when an ANY query is issued. Data is partitioned by date=YYYYMM which is the - year-month that the FDNS ANY study was launched. + when an ANY query is issued. Data is partitioned by date=YYYYMM which is the + year-month that the FDNS ANY study was launched. ARN: arn:aws:s3:::rapid7-opendata/fdns/any/v1/ Region: us-east-1 Type: S3 Bucket @@ -30,11 +30,14 @@ Resources: Region: us-east-1 Type: SNS Topic DataAtWork: - - Title: How to Conduct DNS Reconnaissance for $.02 Using Rapid7 Open Data and AWS - URL: https://blog.rapid7.com/2018/10/16/how-to-conduct-dns-reconnaissance-for-02-using-rapid7-open-data-and-aws/ - AuthorName: Shan Sikdar at Rapid7 - AuthorURL: https://blog.rapid7.com/author/shan/ - - Title: Creating a Project Sonar FDNS API with AWS - URL: http://securityriskadvisors.com/blog/creating-a-project-sonar-fdns-api-with-aws/ - AuthorName: Evan Perotti at SecurityRiskAdvisors - AuthorURL: https://twitter.com/2xxeformyshirt + Tutorials: + - Title: How to Conduct DNS Reconnaissance for $.02 Using Rapid7 Open Data and AWS + URL: https://blog.rapid7.com/2018/10/16/how-to-conduct-dns-reconnaissance-for-02-using-rapid7-open-data-and-aws/ + AuthorName: Shan Sikdar at Rapid7 + AuthorURL: https://blog.rapid7.com/author/shan/ + - Title: Creating a Project Sonar FDNS API with AWS + URL: http://securityriskadvisors.com/blog/creating-a-project-sonar-fdns-api-with-aws/ + AuthorName: Evan Perotti at SecurityRiskAdvisors + AuthorURL: https://twitter.com/2xxeformyshirt + Tools & Applications: + Publications: diff --git a/datasets/sacred-word-counts.yaml b/datasets/sacred-word-counts.yaml deleted file mode 100644 index d56020655..000000000 --- a/datasets/sacred-word-counts.yaml +++ /dev/null @@ -1,20 +0,0 @@ -Name: Translated Sacred Text Word Counts -Description: | - Counts of words used in English-language translations 
of sacred texts, with flag for common words. -Contact: https://data.world/dataremixed/sacred-text-word-counts/discuss -Documentation: https://data.world/dataremixed/sacred-text-word-counts -UpdateFrequency: Unknown -Tags: - - natural language processing - - machine learning -License: Public Domain -Resources: - - Description: Project data files - ARN: arn:aws:s3:::dataworld-odaws-us-east-1/datasets/dataremixed/sacred-text-word-counts/ - Region: us-east-1 - Type: S3 Bucket -DataAtWork: - - Title: Sacred writings from gutenberg.org - URL: https://data.world/dataremixed/sacred-text-word-counts - AuthorName: "@dataremixed on data.world" - AuthorURL: https://data.world/dataremixed \ No newline at end of file diff --git a/datasets/safecast.yaml b/datasets/safecast.yaml index 0a4d88bf3..9bb2cc933 100644 --- a/datasets/safecast.yaml +++ b/datasets/safecast.yaml @@ -24,7 +24,10 @@ Resources: Region: us-west-2 Type: SNS Topic DataAtWork: - - Title: Safecast Map - URL: http://safecast.org/tilemap/ - AuthorName: Nick Dolezal - AuthorURL: https://github.com/frangible + Tutorials: + Tools & Applications: + - Title: Safecast Map + URL: http://safecast.org/tilemap/ + AuthorName: Nick Dolezal + AuthorURL: https://github.com/frangible + Publications: diff --git a/datasets/schweizer-haltestellen-oev.yaml b/datasets/schweizer-haltestellen-oev.yaml index ede8b0b18..5533f89d5 100644 --- a/datasets/schweizer-haltestellen-oev.yaml +++ b/datasets/schweizer-haltestellen-oev.yaml @@ -18,7 +18,10 @@ Resources: Region: eu-west-1 Type: S3 Bucket DataAtWork: - - Title: Map Viewer - URL: https://map.geo.admin.ch/?layers=ch.bav.haltestellen-oev - AuthorName: Swiss Geoportal - AuthorURL: https://twitter.com/swiss_geoportal + Tutorials: + Tools & Applications: + - Title: Map Viewer + URL: https://map.geo.admin.ch/?layers=ch.bav.haltestellen-oev + AuthorName: Swiss Geoportal + AuthorURL: https://twitter.com/swiss_geoportal + Publications: diff --git a/datasets/sentinel-1.yaml 
b/datasets/sentinel-1.yaml index 3cd455a46..f426505b1 100644 --- a/datasets/sentinel-1.yaml +++ b/datasets/sentinel-1.yaml @@ -28,19 +28,22 @@ Resources: Region: eu-central-1 Type: SNS Topic DataAtWork: - - Title: Sentinel Playground - URL: https://apps.sentinel-hub.com/sentinel-playground/?baseWmsUrl=services.sentinel-hub.com&instanceID=a7c04225-b861-452d-ac89-7765352cd855&source=S2&lat=40.98676619345964&lng=28.89301300048828&zoom=13&preset=IW_VV&layers=B04,B03,B02&maxcc=20&gain=1.0&gamma=1.0&time=2015-01-01%7C2018-01-16&atmFilter=&showDates=false - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: Sentinel Hub WMS/WMTS/WCS Service by Sinergise - URL: http://www.sentinel-hub.com/apps/wms - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: EOS Land Viewer - URL: https://eos.com/landviewer/ - AuthorName: Earth Observing System - AuthorURL: https://eos.com/ - - Title: EO Browser - URL: http://apps.sentinel-hub.com/eo-browser/ - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ + Tutorials: + Tools & Applications: + - Title: Sentinel Playground + URL: https://apps.sentinel-hub.com/sentinel-playground/?baseWmsUrl=services.sentinel-hub.com&instanceID=a7c04225-b861-452d-ac89-7765352cd855&source=S2&lat=40.98676619345964&lng=28.89301300048828&zoom=13&preset=IW_VV&layers=B04,B03,B02&maxcc=20&gain=1.0&gamma=1.0&time=2015-01-01%7C2018-01-16&atmFilter=&showDates=false + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: Sentinel Hub WMS/WMTS/WCS Service by Sinergise + URL: http://www.sentinel-hub.com/apps/wms + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: EOS Land Viewer + URL: https://eos.com/landviewer/ + AuthorName: Earth Observing System + AuthorURL: https://eos.com/ + - Title: EO Browser + URL: http://apps.sentinel-hub.com/eo-browser/ + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + Publications: \ No newline at end of file diff --git 
a/datasets/sentinel-2.yaml b/datasets/sentinel-2.yaml index 6d3d03dd3..4db91882e 100644 --- a/datasets/sentinel-2.yaml +++ b/datasets/sentinel-2.yaml @@ -54,65 +54,68 @@ Resources: Region: eu-central-1 Type: SNS Topic DataAtWork: - - Title: Sentinel Hub WMS/WMTS/WCS Service - URL: http://www.sentinel-hub.com/apps/wms - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: Satellite Search by Remote Pixel - URL: https://remotepixel.ca/projects/satellitesearch.html - AuthorName: Remote Pixel - AuthorURL: https://remotepixel.ca/ - - Title: EOS Land Viewer - URL: https://eos.com/landviewer/ - AuthorName: Earth Observing System - AuthorURL: https://eos.com/ - - Title: Sentinel-2 Cloudless Atlas - URL: https://s2maps.eu/ - AuthorName: EOX - AuthorURL: https://eox.at - - Title: EO Browser - URL: http://apps.sentinel-hub.com/eo-browser/ - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: Sentinel Playground - URL: http://apps.sentinel-hub.com/sentinel-playground/ - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: Python package for working with Sentinel-2 AWS data - URL: https://github.com/sentinel-hub/sentinelhub-py - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: Tutorial for using Sentinel-2 data - URL: https://medium.com/@anttilip/seeing-earth-from-space-from-raw-satellite-data-to-beautiful-high-resolution-images-feb522adfa3f - AuthorName: Antti Lipponen - AuthorURL: https://medium.com/@anttilip - - Title: Sterling Geo Using Sentinel-2 on Amazon Web Services to Create NDVI - URL: https://www.youtube.com/watch?v=3tIIUr-keps - AuthorName: Sterling Geo - - Title: FME Landsat-8/Sentinel-2 File Selector - URL: http://demos.fmeserver.com/landsat-sentinel-selector/ - AuthorName: Safe Software - AuthorURL: https://www.safe.com/ - - Title: Exploring the Chile wildfires with Landsat and Sentinel-2 imagery - URL: 
https://www.gearthblog.com/blog/archives/2017/02/exploring-chile-wildfires-landsat-sentinel-2-imagery.html - AuthorName: Timothy Whitehead - - Title: Using Vector tiles and AWS Lambda, we can build a really simple API to get Landsat and Sentinel images - URL: https://remotepixel.ca/blog/searchapi_20171211.html - AuthorName: Remote Pixel - AuthorURL: https://remotepixel.ca/ - - Title: QGIS plugin for Sentinel-2 data - URL: https://medium.com/sentinel-hub/control-sentinel-hub-from-within-qgis-2a83eb7f13db - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: Spectator - tracking Sentinel 2, accessing the data and quick preview - URL: https://spectator.earth/ - AuthorName: Spectator - AuthorURL: https://spectator.earth/ - - Title: Use the Sentinel Explorer app to explore, visualize, and analyze the entire Sentinel-2 archive - URL: https://sentinel2explorer.esri.com/ - AuthorName: Esri - AuthorURL: https://www.esri.com/en-us/home - - Title: Integrate imagery from the Sentinel-2 archive into your own apps, maps, and analysis with the Sentinel-2 image service - URL: https://www.esri.com/arcgis-blog/products/arcgis-living-atlas/imagery/sentinel-2-more-than-meets-the-eye/ - AuthorName: Esri - AuthorURL: https://www.esri.com/en-us/home + Tutorials: + - Title: Tutorial for using Sentinel-2 data + URL: https://medium.com/@anttilip/seeing-earth-from-space-from-raw-satellite-data-to-beautiful-high-resolution-images-feb522adfa3f + AuthorName: Antti Lipponen + AuthorURL: https://medium.com/@anttilip + - Title: Exploring the Chile wildfires with Landsat and Sentinel-2 imagery + URL: https://www.gearthblog.com/blog/archives/2017/02/exploring-chile-wildfires-landsat-sentinel-2-imagery.html + AuthorName: Timothy Whitehead + - Title: Using Vector tiles and AWS Lambda, we can build a really simple API to get Landsat and Sentinel images + URL: https://remotepixel.ca/blog/searchapi_20171211.html + AuthorName: Remote Pixel + AuthorURL: https://remotepixel.ca/ + - 
Title: Integrate imagery from the Sentinel-2 archive into your own apps, maps, and analysis with the Sentinel-2 image service + URL: https://www.esri.com/arcgis-blog/products/arcgis-living-atlas/imagery/sentinel-2-more-than-meets-the-eye/ + AuthorName: Esri + AuthorURL: https://www.esri.com/en-us/home + Tools & Applications: + - Title: Sentinel Hub WMS/WMTS/WCS Service + URL: http://www.sentinel-hub.com/apps/wms + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: Satellite Search by Remote Pixel + URL: https://remotepixel.ca/projects/satellitesearch.html + AuthorName: Remote Pixel + AuthorURL: https://remotepixel.ca/ + - Title: EOS Land Viewer + URL: https://eos.com/landviewer/ + AuthorName: Earth Observing System + AuthorURL: https://eos.com/ + - Title: Sentinel-2 Cloudless Atlas + URL: https://s2maps.eu/ + AuthorName: EOX + AuthorURL: https://eox.at + - Title: EO Browser + URL: http://apps.sentinel-hub.com/eo-browser/ + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: Sentinel Playground + URL: http://apps.sentinel-hub.com/sentinel-playground/ + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: Python package for working with Sentinel-2 AWS data + URL: https://github.com/sentinel-hub/sentinelhub-py + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: Sterling Geo Using Sentinel-2 on Amazon Web Services to Create NDVI + URL: https://www.youtube.com/watch?v=3tIIUr-keps + AuthorName: Sterling Geo + - Title: FME Landsat-8/Sentinel-2 File Selector + URL: http://demos.fmeserver.com/landsat-sentinel-selector/ + AuthorName: Safe Software + AuthorURL: https://www.safe.com/ + - Title: QGIS plugin for Sentinel-2 data + URL: https://medium.com/sentinel-hub/control-sentinel-hub-from-within-qgis-2a83eb7f13db + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: Spectator - tracking Sentinel 2, accessing the data and quick preview + URL: https://spectator.earth/ + 
AuthorName: Spectator + AuthorURL: https://spectator.earth/ + - Title: Use the Sentinel Explorer app to explore, visualize, and analyze the entire Sentinel-2 archive + URL: https://sentinel2explorer.esri.com/ + AuthorName: Esri + AuthorURL: https://www.esri.com/en-us/home + Publications: \ No newline at end of file diff --git a/datasets/sentinel1-slc-seasia-pds.yaml b/datasets/sentinel1-slc-seasia-pds.yaml index 7e39c0f4f..31fff8b79 100644 --- a/datasets/sentinel1-slc-seasia-pds.yaml +++ b/datasets/sentinel1-slc-seasia-pds.yaml @@ -21,7 +21,10 @@ Resources: Region: ap-southeast-1 Type: S3 Bucket DataAtWork: + Tutorials: - Title: Sentinel-1 Opendataset Wiki and Tutorials URL: https://github.com/earthobservatory/sentinel1-opds/wiki AuthorName: Earth Observatory of Singapore AuthorURL: https://earthobservatory.sg/research-group/geodesy-group-emma-hill/people + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/silo.yaml b/datasets/silo.yaml index 18eb31ee2..92acbd00f 100644 --- a/datasets/silo.yaml +++ b/datasets/silo.yaml @@ -16,20 +16,23 @@ Tags: - sustainability - water - weather -License: | +License: | SILO datasets are constructed by the [Queensland Government](http://www.qld.gov.au/) using observational data provided by the [Australian Bureau of Meteorology](http://www.bom.gov.au/) and are available under the [Creative Commons Attribution 4.0](https://creativecommons.org/licenses/by/4.0/) license. 
-Resources: +Resources: - Description: SILO open data ARN: arn:aws:s3:::silo-open-data Region: ap-southeast-2 Type: S3 Bucket DataAtWork: - - Title: Python script to calculate a regional mean - URL: https://www.longpaddock.qld.gov.au/silo/gridded-data/python - AuthorName: SILO - - Title: NetCDF Operators to calculate seasonal means - URL: https://www.longpaddock.qld.gov.au/silo/gridded-data/nco - AuthorName: SILO - - Title: Convert NetCDF to ESRI ArcASCII or GeoTIFF - URL: https://www.longpaddock.qld.gov.au/silo/gridded-data/conversion - AuthorName: SILO + Tutorials: + Tools & Applications: + - Title: Python script to calculate a regional mean + URL: https://www.longpaddock.qld.gov.au/silo/gridded-data/python + AuthorName: SILO + - Title: NetCDF Operators to calculate seasonal means + URL: https://www.longpaddock.qld.gov.au/silo/gridded-data/nco + AuthorName: SILO + - Title: Convert NetCDF to ESRI ArcASCII or GeoTIFF + URL: https://www.longpaddock.qld.gov.au/silo/gridded-data/conversion + AuthorName: SILO + Publications: \ No newline at end of file diff --git a/datasets/software-heritage.yaml b/datasets/software-heritage.yaml index e6a9d9028..cd56dd31b 100644 --- a/datasets/software-heritage.yaml +++ b/datasets/software-heritage.yaml @@ -35,3 +35,7 @@ Resources: ARN: arn:aws:s3:::softwareheritage Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/spacenet.yaml b/datasets/spacenet.yaml index a234d0ed5..a90ee3be7 100644 --- a/datasets/spacenet.yaml +++ b/datasets/spacenet.yaml @@ -23,30 +23,33 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Getting Started with SpaceNet Data - URL: https://medium.com/the-downlinq/getting-started-with-spacenet-data-827fd2ec9f53 - AuthorName: Adam Van Etten - AuthorURL: https://medium.com/@avanetten - - Title: Introducing the SpaceNet Road Detection and Routing Challenge and Dataset - URL: 
https://medium.com/the-downlinq/introducing-the-spacenet-road-detection-and-routing-challenge-and-dataset-7604de39b779 - AuthorName: David Lindenbaum - AuthorURL: https://medium.com/@david.lindenbaum - - Title: 2nd SpaceNet Competition Winners Code Release - URL: https://medium.com/the-downlinq/2nd-spacenet-competition-winners-code-release-c7473eea7c11 - AuthorName: David Lindenbaum - AuthorURL: https://medium.com/@david.lindenbaum - - Title: Building Extraction with YOLT2 and SpaceNet Data - URL: https://medium.com/the-downlinq/building-extraction-with-yolt2-and-spacenet-data-a926f9ffac4f - AuthorName: Adam Van Etten - AuthorURL: https://medium.com/@avanetten - - Title: "SpaceNet: Winning Implementations and New Imagery Release" - URL: https://medium.com/the-downlinq/spacenet-winning-implementations-and-new-imagery-release-55f738e14253 - AuthorName: Todd Stavish - AuthorURL: https://medium.com/@toddstavish - - Title: Solving SpaceNet Road Detection Challenge With Deep Learning - URL: https://devblogs.nvidia.com/solving-spacenet-road-detection-challenge-deep-learning/ - AuthorName: Jonathan Howe, May Casterline and Abel Brown - AuthorURL: https://devblogs.nvidia.com/author/jonathan-howe/, https://devblogs.nvidia.com/author/may-casterline/, https://devblogs.nvidia.com/author/abel-brown/ - - Title: "Solaris: an open source Python library for analyzing overhead imagery with machine learning" - URL: https://medium.com/the-downlinq/announcing-solaris-an-open-source-python-library-for-analyzing-overhead-imagery-with-machine-48c1489c29f7 - AuthorName: Nick Weir + Tutorials: + - Title: Getting Started with SpaceNet Data + URL: https://medium.com/the-downlinq/getting-started-with-spacenet-data-827fd2ec9f53 + AuthorName: Adam Van Etten + AuthorURL: https://medium.com/@avanetten + Tools & Applications: + - Title: "Solaris: an open source Python library for analyzing overhead imagery with machine learning" + URL: 
https://medium.com/the-downlinq/announcing-solaris-an-open-source-python-library-for-analyzing-overhead-imagery-with-machine-48c1489c29f7 + AuthorName: Nick Weir + Publications: + - Title: Introducing the SpaceNet Road Detection and Routing Challenge and Dataset + URL: https://medium.com/the-downlinq/introducing-the-spacenet-road-detection-and-routing-challenge-and-dataset-7604de39b779 + AuthorName: David Lindenbaum + AuthorURL: https://medium.com/@david.lindenbaum + - Title: 2nd SpaceNet Competition Winners Code Release + URL: https://medium.com/the-downlinq/2nd-spacenet-competition-winners-code-release-c7473eea7c11 + AuthorName: David Lindenbaum + AuthorURL: https://medium.com/@david.lindenbaum + - Title: Building Extraction with YOLT2 and SpaceNet Data + URL: https://medium.com/the-downlinq/building-extraction-with-yolt2-and-spacenet-data-a926f9ffac4f + AuthorName: Adam Van Etten + AuthorURL: https://medium.com/@avanetten + - Title: "SpaceNet: Winning Implementations and New Imagery Release" + URL: https://medium.com/the-downlinq/spacenet-winning-implementations-and-new-imagery-release-55f738e14253 + AuthorName: Todd Stavish + AuthorURL: https://medium.com/@toddstavish + - Title: Solving SpaceNet Road Detection Challenge With Deep Learning + URL: https://devblogs.nvidia.com/solving-spacenet-road-detection-challenge-deep-learning/ + AuthorName: Jonathan Howe, May Casterline and Abel Brown + AuthorURL: https://devblogs.nvidia.com/author/jonathan-howe/, https://devblogs.nvidia.com/author/may-casterline/, https://devblogs.nvidia.com/author/abel-brown/ diff --git a/datasets/tabula-muris.yaml b/datasets/tabula-muris.yaml index 402f469b0..eb3689905 100644 --- a/datasets/tabula-muris.yaml +++ b/datasets/tabula-muris.yaml @@ -20,3 +20,7 @@ Resources: ARN: arn:aws:s3:::czb-tabula-muris Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/tcga.yaml b/datasets/tcga.yaml index 
bda80443b..a1fc2c531 100644 --- a/datasets/tcga.yaml +++ b/datasets/tcga.yaml @@ -15,6 +15,9 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: + Tutorials: - Title: Building High-Throughput Genomics Batch Workflows on AWS URL: https://aws.amazon.com/blogs/apn/getting-to-know-our-apn-genomics-partners/ - AuthorName: Aaron Friedman \ No newline at end of file + AuthorName: Aaron Friedman + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/terrain-tiles.yaml b/datasets/terrain-tiles.yaml index 682fb1d94..46b9715b2 100644 --- a/datasets/terrain-tiles.yaml +++ b/datasets/terrain-tiles.yaml @@ -17,39 +17,42 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: R package for accessing Terrain Tiles - URL: https://cran.r-project.org/web/packages/elevatr/vignettes/introduction_to_elevatr.html - AuthorName: Jeffrey W. Hollister - AuthorURL: https://github.com/jhollist - - Title: Mapzen Terrain Tiles on AWS Reader - URL: https://docs.safe.com/fme/html/FME_Desktop_Documentation/FME_ReadersWriters/terraintilesaws/terraintilesaws.htm - AuthorName: Safe Software - AuthorURL: https://www.safe.com/ - - Title: Sentinel Hub WMS/WMTS/WCS Service for DEM - URL: http://www.sentinel-hub.com/apps/wms - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: Sentinel Playground for DEM - URL: https://apps.sentinel-hub.com/sentinel-playground/?source=DEM&lat=41.902277040963696&lng=-102.83203125&zoom=4 - AuthorName: Sinergise - AuthorURL: http://www.sinergise.com/ - - Title: EOS Land Viewer - URL: https://eos.com/landviewer/ - AuthorName: Earth Observing System - AuthorURL: https://eos.com/ - - Title: Open-Source Elevation Service - URL: https://elevation.racemap.com - AuthorName: Racemap - AuthorURL: https://racemap.com/ - - Title: On The Go Map - URL: https://onthegomap.com/ - AuthorName: On The Go Map - AuthorURL: https://onthegomap.com/ - - Title: "PlanetUtils (GitHub): Scripts and a Docker container to 
download, merge, and resample terrain tiles" - URL: https://github.com/interline-io/planetutils - AuthorName: Interline Technologies - AuthorURL: https://www.interline.io/ - - Title: "PODPAC: Python Library supporting TerrainTiles for analysis" - URL: https://podpac.org/datasets.html#terraintiles - AuthorName: Creare - AuthorURL: http://www.creare.com/ + Tutorials: + Tools & Applications: + - Title: R package for accessing Terrain Tiles + URL: https://cran.r-project.org/web/packages/elevatr/vignettes/introduction_to_elevatr.html + AuthorName: Jeffrey W. Hollister + AuthorURL: https://github.com/jhollist + - Title: Mapzen Terrain Tiles on AWS Reader + URL: https://docs.safe.com/fme/html/FME_Desktop_Documentation/FME_ReadersWriters/terraintilesaws/terraintilesaws.htm + AuthorName: Safe Software + AuthorURL: https://www.safe.com/ + - Title: Sentinel Hub WMS/WMTS/WCS Service for DEM + URL: http://www.sentinel-hub.com/apps/wms + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: Sentinel Playground for DEM + URL: https://apps.sentinel-hub.com/sentinel-playground/?source=DEM&lat=41.902277040963696&lng=-102.83203125&zoom=4 + AuthorName: Sinergise + AuthorURL: http://www.sinergise.com/ + - Title: EOS Land Viewer + URL: https://eos.com/landviewer/ + AuthorName: Earth Observing System + AuthorURL: https://eos.com/ + - Title: Open-Source Elevation Service + URL: https://elevation.racemap.com + AuthorName: Racemap + AuthorURL: https://racemap.com/ + - Title: On The Go Map + URL: https://onthegomap.com/ + AuthorName: On The Go Map + AuthorURL: https://onthegomap.com/ + - Title: "PlanetUtils (GitHub): Scripts and a Docker container to download, merge, and resample terrain tiles" + URL: https://github.com/interline-io/planetutils + AuthorName: Interline Technologies + AuthorURL: https://www.interline.io/ + - Title: "PODPAC: Python Library supporting TerrainTiles for analysis" + URL: https://podpac.org/datasets.html#terraintiles + AuthorName: Creare + 
AuthorURL: http://www.creare.com/ + Publications: diff --git a/datasets/tess.yaml b/datasets/tess.yaml index 3f2fbaa64..c6f4c7ff1 100644 --- a/datasets/tess.yaml +++ b/datasets/tess.yaml @@ -20,7 +20,10 @@ Resources: Region: us-east-1 Type: SNS Topic DataAtWork: - - Title: TESS data available on AWS - URL: https://mast-labs.stsci.io/2018/12/tess-data-available-on-aws - AuthorName: Arfon Smith - AuthorURL: https://twitter.com/arfon + Tutorials: + Tools & Applications: + Publications: + - Title: TESS data available on AWS + URL: https://mast-labs.stsci.io/2018/12/tess-data-available-on-aws + AuthorName: Arfon Smith + AuthorURL: https://twitter.com/arfon diff --git a/datasets/uk-met-office.yaml b/datasets/uk-met-office.yaml index 6a1a22c96..9f801ede6 100644 --- a/datasets/uk-met-office.yaml +++ b/datasets/uk-met-office.yaml @@ -4,11 +4,11 @@ Description: | Met Office atmospheric model data, whilst also experiencing a transformative method of requesting data via Restful APIs on AWS. All ahead of Met Office’s own operationally supported API platform that will be launched in late 2019. - - For information about the data see the [Met Office website](https://www.metoffice.gov.uk/services/data-provision/big-data-drive/wholesale/categories/planetary-scale-applications). - For examples of using the data check out the [examples repository](https://github.com/MetOffice/aws-earth-examples). + + For information about the data see the [Met Office website](https://www.metoffice.gov.uk/services/data/met-office-data-for-reuse/discovery). + For examples of using the data check out the [examples repository](https://github.com/MetOffice/aws-earth-examples). If you need help and support using the data please raise an issue on the examples repository. 
-Documentation: https://github.com/MetOffice/aws-earth-examples +Documentation: https://github.com/MetOffice/aws-earth-examples Contact: https://www.metoffice.gov.uk/about-us/contact UpdateFrequency: Daily (with 24 hour delay) Tags: @@ -57,4 +57,13 @@ Resources: ARN: arn:aws:sns:eu-west-2:021908831235:aws-earth-mo-atmospheric-mogreps-g-prd Region: eu-west-2 Type: SNS Topic - +DataAtWork: + Tutorials: + - Title: Met Office AWS Earth data - Getting Started + URL: https://github.com/MetOffice/aws-earth-examples/blob/master/examples/1.%20Getting%20Started.ipynb + AuthorName: Jacob Tomlinson + - Title: Met Office AWS Earth data - Subscribing to data + URL: https://github.com/MetOffice/aws-earth-examples/blob/master/examples/2.%20Subscribing%20to%20data.ipynb + AuthorName: Jacob Tomlinson + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/unidata-goes.yaml b/datasets/unidata-goes.yaml index 3d6cdd896..0a6afae48 100644 --- a/datasets/unidata-goes.yaml +++ b/datasets/unidata-goes.yaml @@ -23,3 +23,7 @@ Resources: ARN: arn:aws:sns:us-west-2:492151760762:NewGOES16Object Region: us-west-2 Type: SNS Topic +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/usda-naip.yaml b/datasets/usda-naip.yaml index 50fcc6201..c8cfc14dc 100644 --- a/datasets/usda-naip.yaml +++ b/datasets/usda-naip.yaml @@ -21,7 +21,10 @@ Resources: Type: S3 Bucket RequesterPays: True DataAtWork: - - Title: VoyagerSearch showing off Batch + NAIP - URL: https://www.voyagersearch.com/using-aws-batch-to-generate-image-thumbnails-for-voyager - AuthorName: Voyager - AuthorURL: https://www.voyagersearch.com/ \ No newline at end of file + Tutorials: + Tools & Applications: + - Title: VoyagerSearch showing off Batch + NAIP + URL: https://www.voyagersearch.com/using-aws-batch-to-generate-image-thumbnails-for-voyager + AuthorName: Voyager + AuthorURL: https://www.voyagersearch.com/ + Publications: \ No newline at end 
of file diff --git a/datasets/usgs-lidar.yaml b/datasets/usgs-lidar.yaml index c20c377fa..043d75677 100644 --- a/datasets/usgs-lidar.yaml +++ b/datasets/usgs-lidar.yaml @@ -23,15 +23,18 @@ Resources: Type: S3 Bucket RequesterPays: True DataAtWork: - - Title: Using Lambda Layers with USGS 3DEP LiDAR Point Clouds - URL: https://github.com/hobu/usgs-lidar/tree/master/lambda - AuthorName: Howard Butler - AuthorURL: https://twitter.com/howardbutler - - Title: WebGL Visualization of USGS 3DEP Lidar Point Clouds with Potree and Plasio.js - URL: https://usgs.entwine.io/ - AuthorName: Connor Manning - AuthorURL: https://twitter.com/csmannin - - Title: USGS 3DEP Lidar Point Cloud Now Available as Amazon Public Dataset - URL: https://www.usgs.gov/news/usgs-3dep-lidar-point-cloud-now-available-amazon-public-dataset - AuthorName: Department of the Interior, U.S. Geological Survey - AuthorURL: https://www.usgs.gov + Tutorials: + - Title: Using Lambda Layers with USGS 3DEP LiDAR Point Clouds + URL: https://github.com/hobu/usgs-lidar/tree/master/lambda + AuthorName: Howard Butler + AuthorURL: https://twitter.com/howardbutler + - Title: WebGL Visualization of USGS 3DEP Lidar Point Clouds with Potree and Plasio.js + URL: https://usgs.entwine.io/ + AuthorName: Connor Manning + AuthorURL: https://twitter.com/csmannin + Tools & Applications: + Publications: + - Title: USGS 3DEP Lidar Point Cloud Now Available as Amazon Public Dataset + URL: https://www.usgs.gov/news/usgs-3dep-lidar-point-cloud-now-available-amazon-public-dataset + AuthorName: Department of the Interior, U.S. 
Geological Survey + AuthorURL: https://www.usgs.gov diff --git a/datasets/wrf-alaska-snap.yaml b/datasets/wrf-alaska-snap.yaml index c818d5bd6..4cd41e219 100755 --- a/datasets/wrf-alaska-snap.yaml +++ b/datasets/wrf-alaska-snap.yaml @@ -19,3 +19,7 @@ Resources: ARN: arn:aws:s3:::wrf-ak-ar5 Region: us-east-1 Type: S3 Bucket +DataAtWork: + Tutorials: + Tools & Applications: + Publications: \ No newline at end of file diff --git a/datasets/xiph-media.yaml b/datasets/xiph-media.yaml index 91f40d831..6c7cc0076 100644 --- a/datasets/xiph-media.yaml +++ b/datasets/xiph-media.yaml @@ -19,7 +19,10 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Encoding video with AV1 on EC2 - URL: https://media.xiph.org/aws.html - AuthorName: Thomas Daede - AuthorURL: https://www.xiph.org/ + Tutorials: + - Title: Encoding video with AV1 on EC2 + URL: https://media.xiph.org/aws.html + AuthorName: Thomas Daede + AuthorURL: https://www.xiph.org/ + Tools & Applications: + Publications: diff --git a/datasets/ycb-benchmarks.yaml b/datasets/ycb-benchmarks.yaml index 45958c538..e5667651a 100644 --- a/datasets/ycb-benchmarks.yaml +++ b/datasets/ycb-benchmarks.yaml @@ -12,19 +12,22 @@ Resources: Region: us-east-1 Type: S3 Bucket DataAtWork: - - Title: Pre-touch sensing for sequential manipulation - URL: https://ieeexplore.ieee.org/abstract/document/7989594 - AuthorName: Boling Yang, Patrick Lancaster, Joshua R. 
Smith - AuthorURL: https://sensor.cs.washington.edu/jrs.html - - Title: "The Closure Signature: A Functional Approach to Model Underactuated Compliant Robotic Hands" - URL: https://ieeexplore.ieee.org/abstract/document/8304743 - AuthorName: Maria Pozzi, Gionata Salvietti, João Bimbo, Monica Malvezzi, Domenico Prattichizzo - AuthorURL: http://www.dii.unisi.it/~domenico/ - - Title: "Label Fusion: A Pipeline for Generating Ground Truth Labels for Real RGBD Data of Cluttered Scenes" - URL: https://ieeexplore.ieee.org/abstract/document/8460950 - AuthorName: Pat Marion, Peter R. Florence, Lucas Manuelli, Russ Tedrake - AuthorURL: https://groups.csail.mit.edu/locomotion/russt.html - - Title: "Benchmarking in Manipulation Research: Using the Yale-CMU-Berkeley Object and Model Set" - URL: https://ieeexplore.ieee.org/document/7254318 - AuthorName: Berk Calli, Aaron Walsman, Arjun Singh, Siddhartha Srinivasa, Pieter Abbeel, Aaron M Dollar - AuthorURL: https://www.wpi.edu/people/faculty/bcalli + Tutorials: + Tools & Applications: + Publications: + - Title: Pre-touch sensing for sequential manipulation + URL: https://ieeexplore.ieee.org/abstract/document/7989594 + AuthorName: Boling Yang, Patrick Lancaster, Joshua R. Smith + AuthorURL: https://sensor.cs.washington.edu/jrs.html + - Title: "The Closure Signature: A Functional Approach to Model Underactuated Compliant Robotic Hands" + URL: https://ieeexplore.ieee.org/abstract/document/8304743 + AuthorName: Maria Pozzi, Gionata Salvietti, João Bimbo, Monica Malvezzi, Domenico Prattichizzo + AuthorURL: http://www.dii.unisi.it/~domenico/ + - Title: "Label Fusion: A Pipeline for Generating Ground Truth Labels for Real RGBD Data of Cluttered Scenes" + URL: https://ieeexplore.ieee.org/abstract/document/8460950 + AuthorName: Pat Marion, Peter R. 
Florence, Lucas Manuelli, Russ Tedrake + AuthorURL: https://groups.csail.mit.edu/locomotion/russt.html + - Title: "Benchmarking in Manipulation Research: Using the Yale-CMU-Berkeley Object and Model Set" + URL: https://ieeexplore.ieee.org/document/7254318 + AuthorName: Berk Calli, Aaron Walsman, Arjun Singh, Siddhartha Srinivasa, Pieter Abbeel, Aaron M Dollar + AuthorURL: https://www.wpi.edu/people/faculty/bcalli diff --git a/datasets/zinc15.yaml b/datasets/zinc15.yaml index dfafda340..4d5a499f8 100644 --- a/datasets/zinc15.yaml +++ b/datasets/zinc15.yaml @@ -18,7 +18,10 @@ Resources: Type: S3 Bucket RequesterPays: True DataAtWork: - - Title: ZINC Database - URL: http://zinc15.docking.org - AuthorName: John Irwin - AuthorURL: http://irwinlab.compbio.ucsf.edu + Tutorials: + Tools & Applications: + Publications: + - Title: ZINC Database + URL: http://zinc15.docking.org + AuthorName: John Irwin + AuthorURL: http://irwinlab.compbio.ucsf.edu \ No newline at end of file diff --git a/schema.yaml b/schema.yaml index 15dbfda97..ac3c5502f 100644 --- a/schema.yaml +++ b/schema.yaml @@ -59,22 +59,63 @@ mapping: RequesterPays: type: bool DataAtWork: - type: seq + type: map required: False - sequence: - - type: map - mapping: - Title: - type: str - required: True - URL: - type: str - pattern: ^(https?:\/\/)?([\da-z\.-]+)\.([a-z\.]{2,6})(\/.*)*\/?$ - required: True - AuthorName: - type: str - required: True - AuthorURL: - type: str - pattern: ^(https?:\/\/)?([\da-z\.-]+)\.([a-z\.]{2,6})(\/.*)*\/?$ - required: False \ No newline at end of file + mapping: + Tutorials: + type: seq + sequence: + - type: map + mapping: + Title: + type: str + required: True + URL: + type: str + pattern: ^(https?:\/\/)?([\da-z\.-]+)\.([a-z\.]{2,6})(\/.*)*\/?$ + required: True + AuthorName: + type: str + required: True + AuthorURL: + type: str + pattern: ^(https?:\/\/)?([\da-z\.-]+)\.([a-z\.]{2,6})(\/.*)*\/?$ + required: False + Tools & Applications: + type: seq + sequence: + - type: map + mapping: + 
Title: + type: str + required: True + URL: + type: str + pattern: ^(https?:\/\/)?([\da-z\.-]+)\.([a-z\.]{2,6})(\/.*)*\/?$ + required: True + AuthorName: + type: str + required: True + AuthorURL: + type: str + pattern: ^(https?:\/\/)?([\da-z\.-]+)\.([a-z\.]{2,6})(\/.*)*\/?$ + required: False + Publications: + type: seq + sequence: + - type: map + mapping: + Title: + type: str + required: True + URL: + type: str + pattern: ^(https?:\/\/)?([\da-z\.-]+)\.([a-z\.]{2,6})(\/.*)*\/?$ + required: True + AuthorName: + type: str + required: True + AuthorURL: + type: str + pattern: ^(https?:\/\/)?([\da-z\.-]+)\.([a-z\.]{2,6})(\/.*)*\/?$ + required: False \ No newline at end of file