Browse Source

initial commit

pull/4/head
Bob Rudis 9 years ago
commit
f1d982ea95
  1. 4
      .Rbuildignore
  2. 7
      .gitignore
  3. 23
      .travis.yml
  4. 18
      DESCRIPTION
  5. 2
      LICENSE
  6. 4
      NAMESPACE
  7. 6
      R/cdcfluview-package.R
  8. 87
      R/cdcfluview.R
  9. 67
      README.Rmd
  10. 83
      README.md
  11. BIN
      README_files/figure-markdown_github/unnamed-chunk-4-1.png
  12. 21
      cdcfluview.Rproj
  13. 14
      man/cdcfluview.Rd
  14. 36
      man/get_flu_data.Rd
  15. 2
      tests/test-all.R
  16. 6
      tests/testthat/test-cdcfluview.R

4
.Rbuildignore

@ -0,0 +1,4 @@
^.*\.Rproj$
^\.Rproj\.user$
^\.travis\.yml$
^.*md$

7
.gitignore

@ -0,0 +1,7 @@
.Rproj.user
.Rhistory
.RData
.Rproj
src/*.o
src/*.so
src/*.dll

23
.travis.yml

@ -0,0 +1,23 @@
language: c
before_install:
- curl -OL http://raw.github.com/craigcitro/r-travis/master/scripts/travis-tool.sh
- chmod 755 ./travis-tool.sh
- ./travis-tool.sh bootstrap
install:
- ./travis-tool.sh install_github plyr
- ./travis-tool.sh install_deps
script: ./travis-tool.sh run_tests
on_failure:
- ./travis-tool.sh dump_logs
branches:
except:
- /-expt$/
notifications:
email:
on_success: change
on_failure: change

18
DESCRIPTION

@ -0,0 +1,18 @@
Package: cdcfluview
Type: Package
Title: cdcfluview is package that retrieves the data behind the CDC's FluView portal
Version: 0.1
Date: 2015-01-10
Author: Bob Rudis (@hrbrmstr)
Maintainer: Bob Rudis <bob@rudis.net>
Description: The CDC's FluView is a Flash portal and the only way to get flu season
data is to use GUI controls, making it tedious to retrieve updates. This package
uses the same API the portal does to programmatically retrieve data.
URL: http://github.com/hrbrmstr/cdcfluview
BugReports: https://github.com/hrbrmstr/cdcfluview/issues
License: MIT + file LICENSE
Suggests:
testthat
Depends:
R (>= 3.0.0),
httr (>= 0.3.0)

2
LICENSE

@ -0,0 +1,2 @@
YEAR: 2015
COPYRIGHT HOLDER: Bob Rudis

4
NAMESPACE

@ -0,0 +1,4 @@
# Generated by roxygen2 (4.1.0): do not edit by hand
export(get_flu_data)
import(httr)

6
R/cdcfluview-package.R

@ -0,0 +1,6 @@
#' A package to retrive data behind the CDC FluView portal
#' @name cdcfluview
#' @docType package
#' @author Bob Rudis (@@hrbrmstr)
#' @import httr
NULL

87
R/cdcfluview.R

@ -0,0 +1,87 @@
# http://gis.cdc.gov/grasp/fluview/fluportaldashboard.html
#' Retrieve CDC flu data
#'
#' Uses the data source from the CDC FluView \url{http://gis.cdc.gov/grasp/fluview/fluportaldashboard.html}
#' and provides flu reporting data as either a single data frame or a list
#' of data frames (depending on whether either WHO NREVSS or ILINet - or both - is chosen)
#'
#' @param region one of "\code{hhs}", "\code{census}", "\code{national}"
#' @param sub_region depends on the \code{region_type}.\cr
#' For "\code{national}", the \code{sub_region} should be \code{NA}.\cr
#' For "\code{hhs}", should be a vector between \code{1:10}.\cr
#' For "\code{census}", should be a vector between \code{1:9}
#' @param data_source either of "\code{who}" (for WHO NREVSS) or "\code{ilinet}" or "\code{all}" (for both)
#' @param years a vector of years to retrieve data for (i.e. \code{2014} for CDC flu seasn 2014-2015)
#' @return If only a single \code{data_source} is specified, then a single \code{data.frame} is
#' returned, otherwise a named list with each \code{data.frame} is returned.
#' @export
#' @examples \dontrun{
#' flu <- get_flu_data("hhs", 1:10, c("who", "ilinet"), years=2000:2014)
#' }
get_flu_data <- function(region="hhs", sub_region=1:10,
data_source="ilinet", years=2014) {
region <- tolower(region)
data_source <- tolower(data_source)
if (!(region %in% c("hhs", "census", "national")))
stop("Error: region must be one of hhs, census or national")
if (length(region) != 1)
stop("Error: can only select one region")
if (region=="national") sub_region = ""
if ((region=="hhs") && !all(sub_region %in% 1:10))
stop("Error: sub_region values must fall between 1:10 when region is 'hhs'")
if ((region=="census") && !all(sub_region %in% 1:19))
stop("Error: sub_region values must fall between 1:10 when region is 'census'")
if (!all(data_source %in% c("who", "ilinet")))
stop("Error: data_source must be either 'who', 'ilinet' or both")
if (any(years < 1997))
stop("Error: years should be > 1997")
years <- years - 1960
reg <- as.numeric(c("hhs"=1, "census"=2, "national"=3)[[region]])
data_source <- gsub("who", "WHO_NREVSS", data_source)
data_source <- gsub("ilinet", "ILINet", data_source)
params <- list(SubRegionsList=sub_region,
DataSources=data_source,
RegionID=reg,
SeasonsList=years)
out_file <- tempfile(fileext=".zip")
tmp <- POST("http://gis.cdc.gov/grasp/fluview/FluViewPhase2CustomDownload.ashx",
body=params,
write_disk(out_file))
stop_for_status(tmp)
if (!(file.exists(out_file)))
stop("Error: cannot process downloaded data")
out_dir <- tempdir()
files <- unzip(out_file, exdir=out_dir, overwrite=TRUE)
file_list <- lapply(files, function(x) {
ct <- ifelse(grepl("who", x, ignore.case=TRUE), 0, 1)
read.csv(x, header=TRUE, skip=ct, stringsAsFactors=FALSE)
})
names(file_list) <- substr(basename(files), 1, 3)
if (length(file_list) == 1) {
return(file_list[[1]])
} else {
return(file_list)
}
}

67
README.Rmd

@ -0,0 +1,67 @@
---
title: "README"
author: "Bob Rudis"
date: January 10, 2015
output:
md_document:
variant: markdown_github
---
The CDC's FluView is a Flash portal and the only way to get flu season
data is to use GUI controls, making it tedious to retrieve updates. This package
uses the same API the portal does to programmatically retrieve data.
The following functions are implemented:
- `get_flu_data` : retrieve flu data
The following data sets are included:
### News
- Version 0.1 released
### Installation
```{r eval=FALSE}
devtools::install_github("hrbrmstr/cdcfluview")
```
```{r echo=FALSE, message=FALSE, warning=FALSE, error=FALSE}
options(width=120)
```
### Usage
```{r}
library(cdcfluview)
library(ggplot2)
# current verison
packageVersion("cdcfluview")
flu <- get_flu_data("hhs", sub_region=1:10, "ilinet", years=2014)
dplyr::glimpse(flu)
gg <- ggplot(flu, aes(x=WEEK, y=X..WEIGHTED.ILI, group=REGION))
gg <- gg + geom_line()
gg <- gg + facet_wrap(~REGION, ncol=2)
gg <- gg + theme_bw()
```
```{r echo=FALSE, fig.height=10, fig.width=6}
gg
```
### Test Results
```{r}
library(cdcfluview)
library(testthat)
date()
test_dir("tests/")
```

83
README.md

@ -0,0 +1,83 @@
The CDC's FluView is a Flash portal and the only way to get flu season data is to use GUI controls, making it tedious to retrieve updates. This package uses the same API the portal does to programmatically retrieve data.
The following functions are implemented:
- `get_flu_data` : retrieve flu data
The following data sets are included:
### News
- Version 0.1 released
### Installation
``` r
devtools::install_github("hrbrmstr/cdcfluview")
```
### Usage
``` r
library(cdcfluview)
```
## Loading required package: httr
``` r
library(ggplot2)
# current verison
packageVersion("cdcfluview")
```
## [1] '0.1'
``` r
flu <- get_flu_data("hhs", sub_region=1:10, "ilinet", years=2014)
dplyr::glimpse(flu)
```
## Variables:
## $ REGION.TYPE (chr) "HHS Regions", "HHS Regions", "HHS Regions", "HHS Regions", "HHS Regions", "HHS Regions",...
## $ REGION (chr) "Region 1", "Region 2", "Region 3", "Region 4", "Region 5", "Region 6", "Region 7", "Regi...
## $ YEAR (int) 2014, 2014, 2014, 2014, 2014, 2014, 2014, 2014, 2014, 2014, 2014, 2014, 2014, 2014, 2014,...
## $ WEEK (int) 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 41, 41, 41, 41, 41, 41, 41, 41, 41, 41, 42, 42, 4...
## $ ILITOTAL (int) 352, 2239, 1689, 1173, 1083, 1843, 217, 348, 1201, 61, 386, 2108, 1735, 1501, 1117, 2163,...
## $ TOTAL.PATIENTS (int) 50896, 134096, 128589, 127408, 106896, 103717, 50032, 36991, 85312, 10868, 50711, 129275,...
## $ NUM..OF.PROVIDERS (int) 142, 253, 242, 299, 266, 236, 83, 117, 227, 53, 148, 242, 238, 305, 277, 246, 83, 114, 24...
## $ X..WEIGHTED.ILI (dbl) 0.8825503, 1.8170454, 1.2055377, 0.8357537, 0.7384711, 1.8292926, 0.6895413, 0.6733888, 1...
## $ X.UNWEIGHTED.ILI (dbl) 0.6916064, 1.6696993, 1.3134872, 0.9206643, 1.0131343, 1.7769507, 0.4337224, 0.9407694, 1...
## $ AGE.0.4 (int) 101, 872, 395, 330, 358, 465, 50, 82, 261, 22, 109, 837, 404, 353, 339, 560, 57, 58, 281,...
## $ AGE.5.24 (int) 185, 758, 627, 530, 400, 710, 97, 152, 532, 30, 199, 675, 664, 763, 443, 807, 124, 146, 5...
## $ AGE.25.64 (lgl) NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, N...
## $ AGE.25.49 (int) 44, 351, 451, 187, 181, 469, 42, 87, 202, 7, 37, 338, 461, 248, 182, 509, 54, 87, 216, 20...
## $ AGE.50.64 (int) 13, 150, 126, 80, 80, 121, 15, 19, 101, 1, 24, 148, 131, 73, 105, 187, 17, 23, 117, 10, 2...
## $ AGE.65 (int) 9, 108, 90, 46, 64, 78, 13, 8, 105, 1, 17, 110, 75, 64, 48, 100, 11, 12, 97, 3, 8, 108, 8...
``` r
gg <- ggplot(flu, aes(x=WEEK, y=X..WEIGHTED.ILI, group=REGION))
gg <- gg + geom_line()
gg <- gg + facet_wrap(~REGION, ncol=2)
gg <- gg + theme_bw()
```
![](README_files/figure-markdown_github/unnamed-chunk-4-1.png)
### Test Results
``` r
library(cdcfluview)
library(testthat)
date()
```
## [1] "Sat Jan 10 20:25:05 2015"
``` r
test_dir("tests/")
```
## basic functionality :

BIN
README_files/figure-markdown_github/unnamed-chunk-4-1.png

Binary file not shown.

After

Width:  |  Height:  |  Size: 64 KiB

21
cdcfluview.Rproj

@ -0,0 +1,21 @@
Version: 1.0
RestoreWorkspace: Default
SaveWorkspace: Default
AlwaysSaveHistory: Default
EnableCodeIndexing: Yes
UseSpacesForTab: Yes
NumSpacesForTab: 2
Encoding: UTF-8
RnwWeave: Sweave
LaTeX: pdfLaTeX
StripTrailingWhitespace: Yes
BuildType: Package
PackageUseDevtools: Yes
PackageInstallArgs: --no-multiarch --with-keep.source
PackageBuildArgs: --resave-data
PackageRoxygenize: rd,collate,namespace

14
man/cdcfluview.Rd

@ -0,0 +1,14 @@
% Generated by roxygen2 (4.1.0): do not edit by hand
% Please edit documentation in R/cdcfluview-package.R
\docType{package}
\name{cdcfluview}
\alias{cdcfluview}
\alias{cdcfluview-package}
\title{A package to retrive data behind the CDC FluView portal}
\description{
A package to retrive data behind the CDC FluView portal
}
\author{
Bob Rudis (@hrbrmstr)
}

36
man/get_flu_data.Rd

@ -0,0 +1,36 @@
% Generated by roxygen2 (4.1.0): do not edit by hand
% Please edit documentation in R/cdcfluview.R
\name{get_flu_data}
\alias{get_flu_data}
\title{Retrieve CDC flu data}
\usage{
get_flu_data(region = "hhs", sub_region = 1:10, data_source = "ilinet",
years = 2014)
}
\arguments{
\item{region}{one of "\code{hhs}", "\code{census}", "\code{national}"}
\item{sub_region}{depends on the \code{region_type}.\cr
For "\code{national}", the \code{sub_region} should be \code{NA}.\cr
For "\code{hhs}", should be a vector between \code{1:10}.\cr
For "\code{census}", should be a vector between \code{1:9}}
\item{data_source}{either of "\code{who}" (for WHO NREVSS) or "\code{ilinet}" or "\code{all}" (for both)}
\item{years}{a vector of years to retrieve data for (i.e. \code{2014} for CDC flu seasn 2014-2015)}
}
\value{
If only a single \code{data_source} is specified, then a single \code{data.frame} is
returned, otherwise a named list with each \code{data.frame} is returned.
}
\description{
Uses the data source from the CDC FluView \url{http://gis.cdc.gov/grasp/fluview/fluportaldashboard.html}
and provides flu reporting data as either a single data frame or a list
of data frames (depending on whether either WHO NREVSS or ILINet - or both - is chosen)
}
\examples{
\dontrun{
flu <- get_flu_data("hhs", 1:10, c("who", "ilinet"), years=2000:2014)
}
}

2
tests/test-all.R

@ -0,0 +1,2 @@
library(testthat)
test_check("cdcfluview")

6
tests/testthat/test-cdcfluview.R

@ -0,0 +1,6 @@
context("basic functionality")
test_that("we can do something", {
#expect_that(some_function(), is_a("data.frame"))
})
Loading…
Cancel
Save