diff --git a/README.md b/README.md index ce0927b..2003f5b 100644 --- a/README.md +++ b/README.md @@ -74,6 +74,23 @@ mlmRev|guImmun|Immunization in Guatemala|2159|13 mlmRev|guPrenat|Prenatal care in Guatemala|2449|15 mlmRev|star|Student Teacher Achievement Ratio (STAR) project data|26796|18 +# How to add datasets from a new package + +**Step 1: add the data from the package** + + 1. In your clone of this repo `mkdir -p data/$PKG` + 2. Go to CRAN + 3. Download the *source package* + 4. Extract one or more of the datasets in the `data` directory into the new directory + +**Step 2: add the metadata** + +Run the script: + + $ scripts/update_doc_one.sh $PKG + +Now it's ready for you to submit your pull request. + # Licensing and Intellectual Property Following Vincent's lead, we have assumed that all of the data sets in this repository can be made available under the GPL-3 license. If you know that one of the datasets released here should not be released publicly or if you know that a data set can only be released under a different license, please contact me so that I can remove the data set from this repository. diff --git a/doc/datasets.csv b/doc/datasets.csv index b8081be..8de3ed7 100644 --- a/doc/datasets.csv +++ b/doc/datasets.csv @@ -506,6 +506,36 @@ "datasets","volcano","Topographic Information on Auckland's Maunga Whau Volcano",87,61 "datasets","warpbreaks","The Number of Breaks in Yarn during Weaving",54,3 "datasets","women","Average Heights and Weights for American Women",15,2 +"gamair","aral","aral",488,4 +"gamair","aral.bnd","aral.bnd",107,3 +"gamair","bird","bird",25100,7 +"gamair","blowfly","blowfly",180,3 +"gamair","bone","bone",23,4 +"gamair","brain","brain",1567,6 +"gamair","cairo","cairo",3780,7 +"gamair","chicago","chicago",5114,8 +"gamair","chl","chl",13840,7 +"gamair","co2s","co2s",507,4 +"gamair","coast","coast",2091,3 +"gamair","engine","engine",19,3 +"gamair","gas","gas",60,804 +"gamair","harrier","harrier",37,3 +"gamair","hubble","hubble",24,4 +"gamair","ipo","ipo",156,7 +"gamair","mack","mack",634,17 +"gamair","mackp","mackp",1162,9 +"gamair","med","med",1476,25 +"gamair","meh","meh",1476,24 +"gamair","mpg","mpg",205,27 +"gamair","prostate","prostate",654,530 +"gamair","sitka","sitka",1027,6 +"gamair","sole","sole",1575,8 +"gamair","sperm.comp1","sperm.comp1",15,5 +"gamair","sperm.comp2","sperm.comp2",24,11 +"gamair","stomata","stomata",24,4 +"gamair","swer","swer",2196,10 +"gamair","wesdr","wesdr",669,5 +"gamair","wine","wine",47,8 "gap","PD","A study of Parkinson's disease and APOE, LRRK2, SNCA makers",825,22 "gap","aldh2","ALDH2 markers and Alcoholism",263,18 "gap","apoeapoc","APOE/APOC1 markers and Alzheimer's",353,8 @@ -732,33 +762,3 @@ "vcd","VonBort","Von Bortkiewicz Horse Kicks Data",280,4 "vcd","WeldonDice","Weldon's Dice Data",11,2 "vcd","WomenQueue","Women in Queues",11,2 -"gamair","aral.bnd","aral.bnd",107,3 -"gamair","aral","aral",488,4 -"gamair","bird","bird",25100,7 -"gamair","blowfly","blowfly",180,3 -"gamair","bone","bone",23,4 -"gamair","brain","brain",1567,6 -"gamair","cairo","cairo",3780,7 -"gamair","chicago","chicago",5114,8 -"gamair","chl","chl",13840,7 -"gamair","co2s","co2s",507,4 -"gamair","coast","coast",2091,3 -"gamair","engine","engine",19,3 -"gamair","gas","gas",60,804 -"gamair","harrier","harrier",37,3 -"gamair","hubble","hubble",24,4 -"gamair","ipo","ipo",156,7 -"gamair","mack","mack",634,17 -"gamair","mackp","mackp",1162,9 -"gamair","med","med",1476,25 -"gamair","meh","meh",1476,24 -"gamair","mpg","mpg",205,27 -"gamair","prostate","prostate",654,530 -"gamair","sitka","sitka",1027,6 -"gamair","sole","sole",1575,8 -"gamair","sperm.comp1","sperm.comp1",15,5 -"gamair","sperm.comp2","sperm.comp2",24,11 -"gamair","stomata","stomata",24,4 -"gamair","swer","swer",2196,10 -"gamair","wesdr","wesdr",669,5 -"gamair","wine","wine",47,8 diff --git a/scripts/update_doc_all.sh b/scripts/update_doc_all.sh new file mode 100755 index 0000000..0d8ff1a --- /dev/null +++ b/scripts/update_doc_all.sh @@ -0,0 +1,4 @@ +R --no-save < 0) @@ -114,7 +161,7 @@ update_docs <- function(pkg_dir) { } write <- function(df, fn) { - write.table(df, file = fn, sep = ",", qmethod = "escape", row.names = FALSE) + write.table(df, file = fn, sep = ",", qmethod = "double", row.names = FALSE) } clean <- function(df) {