From d2f8cb854921faaa1a95964a1c82212a53212d9c Mon Sep 17 00:00:00 2001 From: Xiaming Chen Date: Sat, 2 Jan 2016 20:23:00 +0800 Subject: [PATCH] Clean list format --- .travis.yml | 4 +- README.rst | 115 ++++++++++++++++++++++++++-------------------------- 2 files changed, 61 insertions(+), 58 deletions(-) diff --git a/.travis.yml b/.travis.yml index 23b0500..8a16046 100644 --- a/.travis.yml +++ b/.travis.yml @@ -5,4 +5,6 @@ before_script: - gem install awesome_bot script: - site404=www.datawrangling.com,getglue-data.s3.amazonaws.com,archive.org/details/2011-05-calufa-twitter-sql,www.stats4stem.org,lib.stat.cmu.edu - - awesome_bot README.rst --allow-dupe --allow-redirect --white-list $site404,travis,crawdad.cs.dartmouth.edu,data.nasdaq.com,137.189.35.203/WebUI/CatDatabase/catData.html,datamob.org,numbrary.com,www.cmr.osu.edu,wiki.earthdata.nasa.gov \ No newline at end of file + - whtlist=travis,crawdad.cs.dartmouth.edu,data.nasdaq.com,137.189.35.203/WebUI/CatDatabase/catData.html,numbrary.com,www.cmr.osu.edu,wiki.earthdata.nasa.gov,missionlocal.org + - site503=labrosa.ee.columbia.edu/millionsong,datamob.org + - awesome_bot README.rst --allow-dupe --allow-redirect --white-list $site404,$whtlist,$site503 \ No newline at end of file diff --git a/README.rst b/README.rst index ffa9c01..db47ca9 100644 --- a/README.rst +++ b/README.rst @@ -36,7 +36,7 @@ Biology * `MIT Cancer Genomics Data `_ * `NIH Microarray data `_ or `FTP `_ * `OpenSNP genotypes data `_ -* `Pathguid: Protein-Protein Interactions Catalog `_ +* `Pathguide - Protein-Protein Interactions Catalog `_ * `Protein Data Bank `_ * `PubChem Project `_ * `PubGene (now Coremine Medical) `_ @@ -132,20 +132,20 @@ Economics * `American Economic Ass (AEA) `_ * `EconData from UMD `_ +* `Economic Freedom of the World Data `_ +* `Historical MacroEconomic Statistics `_ +* `International Trade Statistics `_ * `Internet Product Code Database `_ -* `OpenCorporates Database of Companies in the World `_ * `Joint External Debt Data 
Hub `_ +* `Jon Haveman International Trade Data Links `_ +* `OpenCorporates Database of Companies in the World `_ +* `Our World in Data `_ +* `SciencesPo World Trade Gravity Datasets `_ * `The Atlas of Economic Complexity `_ -* `The Observatory of Economic Complexity `_ * `The Center for International Data `_ +* `The Observatory of Economic Complexity `_ * `UN Commodity Trade Statistics `_ * `UN Human Development Reports `_ -* `International Trade Statistics `_ -* `Historical MacroEconomc Statistics `_ -* `SciencesPo World Trade Gravity Datasets `_ -* `Jon Haveman International Trade Data Links `_ -* `Economic Freedom of the World Data `_ -* `Our World in Data `_ Energy @@ -181,9 +181,9 @@ Finance Geology ------- +* `Earth Models `_ * `Smithsonian Institution Global Volcano and Eruption Database `_ * `USGS Earthquake Archives `_ -* `Earth Models `_ GeoSpace/GIS @@ -194,8 +194,10 @@ GeoSpace/GIS * `EOSDIS - NASA's earth observing system data `_ * `Factual Global Location Data `_ * `Geo Spatial Data from ASU `_ +* `Geo Wiki Project - Citizen-driven Environmental Monitoring `_ * `GeoNames Worldwide `_ * `Global Administrative Areas Database (GADM) `_ +* `International Institute for Systems Analysis - GIS Datasets `_ * `Landsat 8 on AWS `_ * `List of all countries in all languages `_ * `Natural Earth - vectors and rasters of the world `_ @@ -205,10 +207,8 @@ GeoSpace/GIS * `TIGER/Line - U.S. 
boundaries and roads `_ * `TwoFishes - Foursquare's coarse geocoder `_ * `TZ Timezones shapfiles `_ -* `World countries in multiple formats `_ -* `International Institute for Systems Analysis - GIS Datasets `_ -* `Geo Wiki Project - Citizen-driven Environmental Monitoring `_ * `UN Environmental Data `_ +* `World countries in multiple formats `_ Government @@ -216,8 +216,8 @@ Government * `Alberta, Province of Canada `_ * `Antwerp, Belgium `_ -* `Argentina `_ * `Argentina (non official) `_ +* `Argentina `_ * `Austin, TX, US `_ * `Australia (abs.gov.au) `_ * `Australia (data.gov.au) `_ @@ -231,6 +231,7 @@ Government * `Canada `_ * `Chicago `_ * `Dallas Open Data `_ +* `DataBC - data from the Province of British Columbia `_ * `Denver Open Data `_ * `Durham, NC Open Data `_ * `Edmonton, AB, Canada `_ @@ -251,8 +252,8 @@ Government * `Indian Government Data `_ * `Indonesian Data Portal `_ * `Laval, QC, Canada `_ -* `London, ON, Canada `_ * `London Datastore, UK `_ +* `London, ON, Canada `_ * `Los Angeles Open Data `_ * `MassGIS, Massachusetts, U.S. 
`_ * `Mexico `_ @@ -302,7 +303,6 @@ Government * `Uruguay `_ * `Vancouver, BC Open Data Catalog `_ * `Victoria, BC, Canada `_ -* `DataBC - data from the Province of British Columbia `_ Healthcare @@ -332,16 +332,11 @@ Image Processing * `Indoor Scene Recognition `_ * `International Affective Picture System, UFL `_ * `Massive Visual Memory Stimuli, MIT `_ +* `Several Shape-from-Silhouette Datasets `_ * `Stanford Dogs Dataset `_ * `SUN database, MIT `_ * `The Oxford-IIIT Pet Dataset `_ * `YouTube Faces Database `_ -* `Several Shape-from-Silhouette Datasets `_ - -Legal ----------------- - -* `Canadian Legal Information Institute `_ Machine Learning @@ -367,13 +362,13 @@ Machine Learning Museums ------- +* `Canada Science and Technology Museums Corporation's Open Data `_ * `Cooper-Hewitt's Collection Database `_ * `Minneapolis Institute of Arts metadata `_ * `Natural History Museum (London) Data Portal `_ * `Rijksmuseum Historical Art Collection `_ * `Tate Collection metadata `_ * `The Getty vocabularies `_ -* `Canada Science and Technology Museums Corporation's Open Data `_ Natural Language @@ -409,7 +404,7 @@ Physics Psychology/Cognition --------------- +-------------------- * `OSU Cognitive Modeling Repository Datasets `_ @@ -449,69 +444,77 @@ Search Engines * `DataMarket (Qlik) `_ * `Harvard Dataverse Network of scientific data `_ * `ICPSR (UMICH) `_ -* `Open Data Certificates (beta) `_ -* `Statista.com - statistics and Studies `_ * `Institute of Education Sciences `_ -* `National Technical Reports Library `_ +* `National Technical Reports Library `_ +* `Open Data Certificates (beta) `_ +* `OpenDataNetwork - A search engine of all Socrata powered data portals `_ +* `Statista.com - statistics and Studies `_ +* `Zenodo - An open dependable home for the long-tail of science `_ -Social Sciences +Social Networks --------------- -* `72 hours #gamergate scrape `_ +* `72 hours #gamergate Twitter Scrape `_ * `Ancestry.com Forum Dataset over 10 years `_ * `Cheng-Caverlee-Lee 
September 2009 - January 2010 Twitter Scrape `_ * `CMU Enron Email of 150 users `_ * `EDRM Enron EMail of 151 users, hosted on S3 `_ * `Facebook Data Scrape (2005) `_ * `Facebook Social Networks from LAW (since 2007) `_ -* `FBI Hate Crime 2013 - aggregated data `_ * `Foursquare from UMN/Sarwat (2013) `_ -* `GDELT Global Events Database `_ -* `General Social Survey (GSS) since 1972 `_ * `GetGlue - users rating TV shows `_ * `GitHub Collaboration Archive `_ * `Google Scholar citation relations `_ -* `MIT Reality Mining Dataset `_ * `Mobile Social Networks from UMASS `_ * `Network Twitter Data `_ -* `PewResearch Internet Survey Project `_ -* `PewResearch Society Data Collection `_ -* `Political Polarity Data `_ * `Reddit Comments `_ * `Skytrax' Air Travel Reviews Dataset `_ * `Social Twitter Data `_ * `SourceForge.net Research Data `_ -* `StackExchange Data Explorer `_ -* `Texas Inmates Executed Since 1984 `_ -* `Titanic Survival Data Set `_ * `Twitter Data for Sentiment Analysis `_ * `Twitter Graph of entire Twitter site `_ * `Twitter Scrape Calufa May 2011 `_ -* `UCB's Archive of Social Science Data (D-Lab) `_ -* `UCLA Social Sciences Data Archive `_ * `UNIMI/LAW Social Network Datasets `_ -* `Universities Worldwide `_ -* `UPJOHN for Labor Employment Research `_ * `Yahoo! 
Graph and Social Data `_ * `Youtube Video Social Graph in 2007,2008 `_ + + +Social Sciences +--------------- + +* `Canadian Legal Information Institute `_ +* `Center for Systemic Peace Datasets - Conflict Trends, Polities, State Fragility, etc `_ * `Correlates of War Project `_ -* `The MacroData Guide by Norsk samfunnsvitenskapelig datatjeneste `_ * `Cryptome Conspiracy Theory Items `_ * `Datacards `_ +* `European Social Survey `_ +* `FBI Hate Crime 2013 - aggregated data `_ +* `GDELT Global Events Database `_ +* `General Social Survey (GSS) since 1972 `_ +* `General Social Survey `_ +* `German Social Survey `_ * `Global Religious Futures Project `_ * `Institute for Demographic Studies `_ -* `UN Civil Society Database `_ -* `Terrorism Research and Analysis Consortium `_ -* `Center for Systemic Peace Datasets - Conflict Trends, Polities, State Fragility, etc `_ * `International Networks Archive `_ -* `Paul Hensel General International Data Page `_ -* `James McGuire Cross National Data `_ -* `International Studies Compendium Project `_ -* `European Social Survey `_ -* `General Social Survey `_ * `International Social Survey Program ISSP `_ -* `German Social Survey `_ +* `International Studies Compendium Project `_ +* `James McGuire Cross National Data `_ +* `MIT Reality Mining Dataset `_ +* `Paul Hensel General International Data Page `_ +* `PewResearch Internet Survey Project `_ +* `PewResearch Society Data Collection `_ +* `Political Polarity Data `_ +* `StackExchange Data Explorer `_ +* `Terrorism Research and Analysis Consortium `_ +* `Texas Inmates Executed Since 1984 `_ +* `The MacroData Guide by Norsk samfunnsvitenskapelig datatjeneste `_ +* `Titanic Survival Data Set `_ +* `UCB's Archive of Social Science Data (D-Lab) `_ +* `UCLA Social Sciences Data Archive `_ +* `UN Civil Society Database `_ +* `Universities Worldwide `_ +* `UPJOHN for Labor Employment Research `_ Sports @@ -528,11 +531,11 @@ Sports Time Series ----------- +* `Databanks International Cross 
National Time Series Data Archive `_ * `Hard Drive Failure Rates `_ * `Heart Rate Time Series from MIT `_ * `Time Series Data Library (TSDL) from MU `_ * `UC Riverside Time Series Dataset `_ -* `Databanks International Cross National Time Series Data Archive `_ Transportation @@ -564,13 +567,11 @@ Transportation Complementary Collections ------------------------- +* `Database of Scientific Code Contributions `_ * DataWrangling: `Some Datasets Available on the Web `_ * Inside-r: `Finding Data on the Internet `_ * OpenDataMonitor: `An overview of available open data resources in Europe `_ -* OpenDataNetwork: `A search engine of all Socrata powered data portals ranging from small cities to federal agencies and non-profits `_ * Quora: `Where can I find large datasets open to the public? `_ * RS.io: `100+ Interesting Data Sets for Statistics `_ * StaTrek: `Leveraging open data to understand urban lives `_ -* Zenodo: `An open dependable home for the long-tail of science, enabling researchers to share and preserve any research outputs in any size, any format and from any science. `_ -* `Database of Scientific Code Contributions `_