diff --git a/.Rbuildignore b/.Rbuildignore index 3f2fc89b..697d8b52 100644 --- a/.Rbuildignore +++ b/.Rbuildignore @@ -20,4 +20,7 @@ ^.venv$ ^env$ ^.env$ +^README\.Rmd$ ^CRAN-SUBMISSION$ +^LICENSE\.md$ +^revdep$ diff --git a/.bumpversion.cfg b/.bumpversion.cfg index c4459027..f6301400 100644 --- a/.bumpversion.cfg +++ b/.bumpversion.cfg @@ -1,5 +1,5 @@ [bumpversion] -current_version = 1.0.0 +current_version = 1.0.0.9000 commit = False tag = False diff --git a/.github/CODEOWNERS b/.github/CODEOWNERS index 16f04afb..b8a5df51 100644 --- a/.github/CODEOWNERS +++ b/.github/CODEOWNERS @@ -1 +1 @@ -* @dshemetov @brookslogan @dsweber2 +* @dshemetov @brookslogan @dsweber2 @nmdefries diff --git a/.github/pull_request_template.md b/.github/pull_request_template.md new file mode 100644 index 00000000..ee44a838 --- /dev/null +++ b/.github/pull_request_template.md @@ -0,0 +1,22 @@ +### Checklist + +Please: + +- [ ] Make sure this PR is against "dev", not "main" (unless this is a release + PR). +- [ ] Request a review from one of the current epidatr main reviewers: + brookslogan, dshemetov, nmdefries, dsweber2. +- [ ] Makes sure to bump the version number in `DESCRIPTION`. Always increment + the patch version number (the third number), unless you are making a + release PR from dev to main, in which case increment the minor version + number (the second number). +- [ ] Describe changes made in NEWS.md, making sure breaking changes + (backwards-incompatible changes to the documented interface) are noted. + Collect the changes under the next release number (e.g. if you are on + 1.7.2, then write your changes under the 1.8 heading). + +### Change explanations for reviewer + +### Magic GitHub syntax to mark associated Issue(s) as resolved when this is merged into the default branch + +- Resolves #{issue number} diff --git a/.github/workflows/R-CMD-check.yaml b/.github/workflows/R-CMD-check.yaml index 338f93d4..a0b910bd 100644 --- a/.github/workflows/R-CMD-check.yaml +++ b/.github/workflows/R-CMD-check.yaml @@ -5,6 +5,7 @@ on: branches: [main, dev] pull_request: branches: [main, dev] + workflow_dispatch: name: R-CMD-check diff --git a/.github/workflows/create_release.yml b/.github/workflows/create_release.yml deleted file mode 100644 index 2d82e6fd..00000000 --- a/.github/workflows/create_release.yml +++ /dev/null @@ -1,43 +0,0 @@ -name: Create Release -on: - workflow_dispatch: - inputs: - versionName: - description: "Semantic Version Number (i.e., 5.5.0 or patch, minor, major, prepatch, preminor, premajor, prerelease)" - required: true - default: patch -jobs: - create_release: - runs-on: ubuntu-latest - steps: - - name: Check out code - uses: actions/checkout@v2 - with: - ref: main - ssh-key: ${{ secrets.CMU_DELPHI_DEPLOY_MACHINE_SSH }} - - name: Reset main branch - run: | - git fetch origin dev:dev - git reset --hard dev - - name: Set up Python 3.8 - uses: actions/setup-python@v2 - with: - python-version: 3.8 - - name: Change version number - id: version - run: | - python -m pip install bump2version - echo -n "::set-output name=next_tag::" - bump2version --list ${{ github.event.inputs.versionName }} | grep new_version | sed -r s,"^.*=",, - - name: Create pull request into main - uses: peter-evans/create-pull-request@v3 - with: - branch: release/${{ steps.version.outputs.next_tag }} - commit-message: "chore: release ${{ steps.version.outputs.next_tag }}" - base: main - title: Release ${{ steps.version.outputs.next_tag }} - labels: chore - reviewers: krivard - assignees: krivard - body: | - Releasing ${{ steps.version.outputs.next_tag }}. diff --git a/.github/workflows/document.yaml b/.github/workflows/document.yaml index fb1ee6b5..17a85104 100644 --- a/.github/workflows/document.yaml +++ b/.github/workflows/document.yaml @@ -2,7 +2,8 @@ # Need help debugging build failures? Start at https://github.com/r-lib/actions#where-to-find-help on: push: - paths: ["R/**"] + paths: ["R/**", "README.Rmd"] + workflow_dispatch: name: Document @@ -26,17 +27,25 @@ jobs: - name: Install dependencies uses: r-lib/actions/setup-r-dependencies@v2 with: - extra-packages: any::roxygen2 - needs: roxygen2 + extra-packages: | + any::devtools + any::roxygen2 + needs: | + devtools + roxygen2 - name: Document run: roxygen2::roxygenise() shell: Rscript {0} + - name: Build README.md from README.Rmd + run: Rscript -e 'devtools::build_readme()' + - name: Commit and push changes run: | git config --local user.name "$GITHUB_ACTOR" git config --local user.email "$GITHUB_ACTOR@users.noreply.github.com" + git add README.md git add man/\* NAMESPACE DESCRIPTION git commit -m "docs: document (GHA)" || echo "No changes to commit" git pull --rebase diff --git a/.github/workflows/lint.yaml b/.github/workflows/lint.yaml index afd9fdbe..4eda2fd3 100644 --- a/.github/workflows/lint.yaml +++ b/.github/workflows/lint.yaml @@ -5,6 +5,7 @@ on: branches: [main, dev] pull_request: branches: [main, dev] + workflow_dispatch: name: lint diff --git a/.github/workflows/pkgdown.yaml b/.github/workflows/pkgdown.yaml index d25a7086..f7bf0f93 100644 --- a/.github/workflows/pkgdown.yaml +++ b/.github/workflows/pkgdown.yaml @@ -5,9 +5,9 @@ # update the documentation web site on pushes to `dev` branch. on: push: - branches: [main] + branches: [main, dev] pull_request: - branches: [main] + branches: [main, dev] release: types: [published] workflow_dispatch: @@ -23,7 +23,7 @@ jobs: group: pkgdown-${{ github.event_name != 'pull_request' || github.run_id }} env: GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }} - DELPHI_EPIDATA_KEY: ${{ secrets.DELPHI_GITHUB_ACTIONS_EPIDATA_API_KEY }} + DELPHI_EPIDATA_KEY: ${{ secrets.SECRET_EPIDATR_GHACTIONS_DELPHI_EPIDATA_KEY }} steps: - uses: actions/checkout@v3 @@ -35,13 +35,29 @@ jobs: - uses: r-lib/actions/setup-r-dependencies@v2 with: - extra-packages: any::pkgdown, local::. + extra-packages: any::pkgdown, local::., any::cli needs: website - name: Build site - env: - DELPHI_EPIDATA_KEY: ${{ secrets.SECRET_EPIDATR_GHACTIONS_DELPHI_EPIDATA_KEY }} - run: pkgdown::build_site_github_pages(new_process = FALSE, install = FALSE) + run: | + override <- if (startsWith("${{ github.event_name }}", "pull_request")) { + if ("${{ github.base_ref }}" == "main") { + list(development = list(mode = "release", version_label = "light")) + } else { + list(development = list(mode = "devel", version_label = "success")) + } + } else { + if ("${{ github.ref_name }}" == "main") { + list(development = list(mode = "release", version_label = "light")) + } else { + list(development = list(mode = "devel", version_label = "success")) + } + } + pkg <- pkgdown::as_pkgdown(".", override = override) + cli::cli_rule("Cleaning files from old site...") + pkgdown::clean_site(pkg) + pkgdown::build_site(pkg, preview = FALSE, install = FALSE, new_process = FALSE) + pkgdown:::build_github_pages(pkg) shell: Rscript {0} - name: Deploy to GitHub pages 🚀 diff --git a/.github/workflows/release_helper.yml b/.github/workflows/release_helper.yml deleted file mode 100644 index 90e288ec..00000000 --- a/.github/workflows/release_helper.yml +++ /dev/null @@ -1,76 +0,0 @@ -name: Release Helper -on: - push: - branches: - - main - -jobs: - correct_repository: - runs-on: ubuntu-latest - steps: - - name: fail on fork - if: github.repository_owner != 'cmu-delphi' - run: exit 1 - - create_release: - needs: correct_repository - runs-on: ubuntu-latest - steps: - - name: Check out code - uses: actions/checkout@v2 - - name: Set up Python 3.8 - uses: actions/setup-python@v2 - with: - python-version: 3.8 - - name: Extract version - id: extract_version - run: | - python -m pip install bump2version - echo -n "::set-output name=version::" - bump2version --dry-run --list patch | grep ^current_version | sed -r s,"^.*=",, - - name: Create Release - id: create_release - uses: release-drafter/release-drafter@v5 - env: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} - with: - version: ${{ steps.extract_version.outputs.version }} - publish: true - outputs: - version: ${{ steps.extract_version.outputs.version }} - upload_url: ${{ steps.create_release.outputs.upload_url }} - tag_name: ${{ steps.create_release.outputs.tag_name }} - - release_package: - needs: create_release - runs-on: ubuntu-latest - steps: - - name: Check out code - uses: actions/checkout@v2 - # TODO - - sync_dev: - needs: correct_repository - runs-on: ubuntu-latest - steps: - - name: Check out code - uses: actions/checkout@v2 - with: - ref: dev - ssh-key: ${{ secrets.CMU_DELPHI_DEPLOY_MACHINE_SSH }} - - name: Reset dev branch - run: | - git fetch origin main:main - git reset --hard main - - name: Create pull request into dev - uses: peter-evans/create-pull-request@v3 - with: - branch: bot/sync-main-dev - commit-message: "chore: sync main-dev" - base: dev - title: "chore: sync main->dev" - labels: chore - reviewers: dshemetov - assignees: dshemetov - body: | - Syncing Main->Dev. diff --git a/.github/workflows/style.yaml b/.github/workflows/style.yaml index c01a2da9..acdc0470 100644 --- a/.github/workflows/style.yaml +++ b/.github/workflows/style.yaml @@ -10,6 +10,7 @@ on: "**.[rR]nw", "**.[rR]profile", ] + workflow_dispatch: name: Style diff --git a/.gitignore b/.gitignore index 2ecf9b05..5a928afe 100644 --- a/.gitignore +++ b/.gitignore @@ -17,3 +17,6 @@ env /Meta/ .secrets epidatr.Rproj +renv.lock +renv/ +.Rprofile \ No newline at end of file diff --git a/.lintr b/.lintr index c0bfc243..c7c90554 100644 --- a/.lintr +++ b/.lintr @@ -3,3 +3,7 @@ linters: linters_with_defaults( cyclocomp_linter = NULL, object_length_linter(length = 40L) ) +exclusions: list( + "renv", + "venv" + ) diff --git a/CRAN-SUBMISSION b/CRAN-SUBMISSION index a0b6ffc6..7716e2f9 100644 --- a/CRAN-SUBMISSION +++ b/CRAN-SUBMISSION @@ -1,3 +1,3 @@ -Version: 1.0.0 -Date: 2023-09-12 08:00:50 UTC -SHA: 52436eb250eab1f9c70b250bf4ca1ab25cc48316 +Version: 1.1.0 +Date: 2024-02-27 20:25:04 UTC +SHA: 693c04bd80d3ffe0b3c012281303c4878de08c70 diff --git a/DESCRIPTION b/DESCRIPTION index 6f00eb30..b478a352 100644 --- a/DESCRIPTION +++ b/DESCRIPTION @@ -1,9 +1,8 @@ Package: epidatr Type: Package Title: Client for Delphi's 'Epidata' API -Version: 1.0.0 -Date: 2023-09-11 -Authors@R: +Version: 1.1.1 +Authors@R: c( person("Logan", "Brooks", email = "lcbrooks@andrew.cmu.edu", role = c("aut")), person("Dmitry", "Shemetov", email = "dshemeto@andrew.cmu.edu", role = c("aut")), @@ -35,14 +34,18 @@ Imports: MMWRweek, purrr, openssl, + rappdirs, readr, tibble, + usethis, xml2 -RoxygenNote: 7.2.3 +RoxygenNote: 7.3.1 Suggests: dplyr, ggplot2, knitr, + maps, + mapproj, rmarkdown, rlang, testthat (>= 3.1.5), @@ -50,7 +53,7 @@ Suggests: VignetteBuilder: knitr Language: en-US Config/testthat/edition: 3 -Collate: +Collate: 'auth.R' 'avail_endpoints.R' 'cache.R' diff --git a/DEVELOPMENT.md b/DEVELOPMENT.md index 95a93c25..63e3340f 100644 --- a/DEVELOPMENT.md +++ b/DEVELOPMENT.md @@ -1,32 +1,64 @@ -## Development Environment - -Relevant R commands +## Setting up the development environment ```r install.packages(c('devtools', 'pkgdown', 'styler', 'lintr')) # install dev dependencies devtools::install_deps(dependencies = TRUE) # install package dependencies devtools::document() # generate package meta data and man files devtools::build() # build package +``` + +## Validating the package + +```r styler::style_pkg() # format code -lintr::lint_package() # lint package +lintr::lint_package() # lint code + devtools::test() # test package devtools::check() # check package for errors ``` -## Release Process +## Developing the documentation site -The release consists of multiple steps which can be all done via the GitHub website: +Our CI builds two version of the documentation: + +- https://cmu-delphi.github.io/epidatr/ from the `main` branch and +- https://cmu-delphi.github.io/epidatr/dev from the `dev` branch. + +The documentation site can be previewed locally by running in R: + +```r +# Should automatically open a browser +pkgdown::build_site(preview=TRUE) +``` -1. Go to [create_release GitHub Action](https://github.com/cmu-delphi/epidatr/actions/workflows/create_release.yml) and click the `Run workflow` button. Enter the next version number or one of the magic keywords (patch, minor, major) and hit the green `Run workflow` button. -2. The action will prepare a new release and will end up with a new [Pull Request](https://github.com/cmu-delphi/epidatr/pulls) -3. Let the code owner review the PR and its changes and let the CI check whether everything builds successfully -4. Once approved and merged, another GitHub action job starts which automatically will - 1. create a git tag - 2. create another [Pull Request](https://github.com/cmu-delphi/epidatr/pulls) to merge the changes back to the `dev` branch - 3. create a [GitHub release](https://github.com/cmu-delphi/epidatr/releases) with automatically derived release notes -5. Release to CRAN +If the above does not open a browser, you can try using a Python server from the +command line: -[mit-image]: https://img.shields.io/badge/License-MIT-yellow.svg -[mit-url]: https://opensource.org/license/MIT -[github-actions-image]: https://github.com/cmu-delphi/epidatr/workflows/ci/badge.svg -[github-actions-url]: https://github.com/cmu-delphi/epidatr/actions +```bash +R -e 'devtools::document()' +R -e 'pkgdown::build_site()' +python -m http.server -d docs +``` + +## Versioning + +Please follow the guidelines in the [PR template document](.github/pull_request_template.md). + +## Release process +First, there's a handy function that makes a github issue; for example, at the time of writing we were doing: +```R +usethis::use_release_issue(version = "1.0.2") +``` +If you want to extend it, add to the `release_bullets` function in [utils.R](https://github.com/cmu-delphi/epidatr/blob/dev/R/utils.R). + First, make sure that all the checks pass + +```R +devtools::check(".", manual = TRUE, env_vars =c(NOT_CRAN = "false")) +``` + +Aim for 10/10, no notes. Generally, follow the issue. `revdep_check` is likely to fail but doesn't seem to be terribly important. So for now ignore it. + +When this has gone smoothly enough, release to CRAN via +```R +devtools::release(check = TRUE) +``` diff --git a/LICENSE b/LICENSE index c90c919a..94c71f45 100644 --- a/LICENSE +++ b/LICENSE @@ -1,2 +1,2 @@ YEAR: 2023 -COPYRIGHT HOLDER: Logan Brooks, Ryan Tibshirani +COPYRIGHT HOLDER: epidatr authors diff --git a/LICENSE.md b/LICENSE.md new file mode 100644 index 00000000..90c4cc71 --- /dev/null +++ b/LICENSE.md @@ -0,0 +1,21 @@ +# MIT License + +Copyright (c) 2023 epidatr authors + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. diff --git a/NAMESPACE b/NAMESPACE index 5e0849a0..c6fed522 100644 --- a/NAMESPACE +++ b/NAMESPACE @@ -2,11 +2,14 @@ S3method(as_tibble,covidcast_data_signal_list) S3method(as_tibble,covidcast_data_source_list) +S3method(print,EpiRange) +S3method(print,EpidataFieldInfo) S3method(print,covidcast_data_signal) S3method(print,covidcast_data_signal_list) S3method(print,covidcast_data_source) S3method(print,covidcast_epidata) S3method(print,epidata_call) +S3method(print,fetch_args) export(avail_endpoints) export(cache_info) export(clear_cache) @@ -15,7 +18,7 @@ export(disable_cache) export(epirange) export(fetch) export(fetch_args_list) -export(get_auth_key) +export(get_api_key) export(pub_covid_hosp_facility) export(pub_covid_hosp_facility_lookup) export(pub_covid_hosp_state_timeseries) @@ -44,9 +47,11 @@ export(pvt_norostat) export(pvt_quidel) export(pvt_sensors) export(pvt_twitter) +export(save_api_key) export(set_cache) import(cachem) import(glue) +importFrom(MMWRweek,MMWRweek) importFrom(MMWRweek,MMWRweek2Date) importFrom(checkmate,assert) importFrom(checkmate,assert_character) @@ -76,6 +81,7 @@ importFrom(openssl,md5) importFrom(purrr,map_chr) importFrom(purrr,map_lgl) importFrom(readr,read_csv) +importFrom(stats,na.omit) importFrom(tibble,as_tibble) importFrom(tibble,tibble) importFrom(utils,help.search) diff --git a/NEWS.md b/NEWS.md index 9dd1990e..25512ee5 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,43 @@ +# epidatr 1.1.1 + +## Changes + +## Features + +## Patches +- Fixed failure when passing `as_of` values in `Date` format to + `pub_covidcast` while caching is enabled (#259) + +# epidatr 1.1.0 + +## Changes +- `pub_covid_hosp_state_timeseries` now supports use of the `as_of` parameter (#209). +- `release_date` and `latest_update` fields are now parsed as `Date`, rather + than as text. This change impacts several endpoints. +- `get_auth_key` renamed to `get_api_key` (#181). +- `get_api_key` no longer reads from R options and only uses environment variables (#217). +- `pvt_twitter` and `pub_wiki` now use `time_type` and `time_values` args instead of mutually exclusive `dates` and `epiweeks` (#236). This matches the interface of the `pub_covidcast` endpoint. +- Updated the default `timeout_seconds` to 15 minutes to allow large queries by default. +## Features +- Function reference now displays commonly-used functions first (#205). +- Support `Date` objects passed to version arguments `as_of` and `issues` in + endpoints (#192, #194). +- `clear_cache` now handles positional arguments just like `set_cache` (#197). +- `set_api_key` now available to help persist API key environment variables (#181, #217). +- All endpoints now support the use of "\*" as a wildcard to fetch all dates or epiweeks (#234). +## Patches +- Endpoints now fail when passed misspelled arguments (#187, #201). +- `pub_fluview_meta` fixed to `fetch` the response automatically. +- `pub_covid_hosp_state_timeseries` now correctly parses the `issue` field, + instead of returning a missing value (#202). +- In `pub_fluview_meta`, `latest_issue` field is now parsed as epiweek, rather + than being parsed as `Date` and returning a missing value. +- `set_cache` cache size no longer runs into integer overflow (#189). +- Improve line-wrapping of warning messages (#191). +- Fix documentation related to CRAN submission. +- Fix some errors from passing "" as a key. +- Fixed bug with NAs when parsing ints (#243). + # epidatr 1.0.0 - Add `set_cache` and other caching functions. diff --git a/R/auth.R b/R/auth.R index 1dbaaf43..53ff13b5 100644 --- a/R/auth.R +++ b/R/auth.R @@ -1,36 +1,77 @@ -#' Getting the API key +#' Get and set API keys #' -#' @description -#' Get the API key from the environment variable `DELPHI_EPIDATA_KEY` or -#' `getOption("delphi.epidata.key")`. +#' Get and set the API key used to make requests to the Epidata API. Without a +#' key, requests may be subject to rate limits and other limitations. #' -#' @return The API key as a string or "". +#' We recommend you register for an API key. While most endpoints are available +#' without one, there are [limits on API usage for anonymous +#' users](https://cmu-delphi.github.io/delphi-epidata/api/api_keys.html), +#' including a rate limit. If you regularly request large amounts of data, +#' please consider [registering for an API +#' key](https://api.delphi.cmu.edu/epidata/admin/registration_form). +#' +#' API keys are strings read from the environment variable `DELPHI_EPIDATA_KEY`. +#' We recommend setting your key with `save_api_key()`, which will modify an +#' applicable `.Renviron` file, which will be read in automatically when you +#' start future R sessions (see [`?Startup`][base::Startup] for details on +#' `.Renviron` files). Alternatively, you can modify the environment variable at +#' the command line before/while launching R, or inside an R session with +#' [`Sys.setenv()`], but these will not persist across sessions. +#' +#' Once an API key is set, it is automatically used for all requests made by +#' functions in this package. +#' +#' @return For `get_api_key()`, returns the current API key as a string, or +#' `""` if none is set. +#' +#' @references +#' - [Delphi Epidata API Keys +#' documentation](https://cmu-delphi.github.io/delphi-epidata/api/api_keys.html). +#' - [Delphi Epidata API Registration +#' Form](https://api.delphi.cmu.edu/epidata/admin/registration_form). #' #' @export -get_auth_key <- function() { +get_api_key <- function() { key <- Sys.getenv("DELPHI_EPIDATA_KEY", unset = "") if (key != "") { return(key) } - key <- getOption("delphi.epidata.key", default = "") - if (key != "") { - return(key) - } - cli::cli_warn( c( - "No API key found. You will be limited to non-complex queries and encounter rate limits if you proceed. - To avoid this, you can get your key by registering - at https://api.delphi.cmu.edu/epidata/admin/registration_form and then:", - "i" = "set the environment variable DELPHI_EPIDATA_KEY", - "i" = "set the option 'delphi.epidata.key'", - "", - "To save your key for later sessions (and hide it from your code), you can edit your .Renviron file with:", - "i" = "usethis::edit_r_environ()" + "No API key found. You will be limited to non-complex queries and encounter rate limits if you proceed.", + "i" = "See {.help save_api_key} for details on obtaining and setting API keys." ), .frequency = "regularly", .frequency_id = "delphi.epidata.key" ) return("") } + +#' @rdname get_api_key +#' @export +save_api_key <- function() { + cli::cli_inform( + c( + "i" = "This function will open your {.code .Renviron} file in a text editor. You will need to + write {.code DELPHI_EPIDATA_KEY=yourkeyhere} (without quotes) in the file and save it. If the editor + does not open, you will need to edit the file manually.", + "i" = "Press enter to continue." + ) + ) + readline() + + if (file.exists(usethis::proj_path(".Renviron"))) { + usethis::edit_r_environ(scope = "project") + + cat("\n\n") + cli::cli_inform( + c( + "i" = "Your project {.code .Renviron} file has been updated. Make sure not to share this + file (add it to .gitignore or equivalents)." + ) + ) + } else { + usethis::edit_r_environ(scope = "user") + } +} diff --git a/R/avail_endpoints.R b/R/avail_endpoints.R index 7677076d..991dff78 100644 --- a/R/avail_endpoints.R +++ b/R/avail_endpoints.R @@ -1,11 +1,13 @@ -#' List all available endpoints. +#' List all available Epidata API endpoints #' #' @description -#' A function that prints a tibble with two columns: `Endpoint` contains the -#' function for accessing the Delphi Epidata API endpoint along with a -#' `Description`. +#' Fetches a data frame of all Epidata API endpoints that can be accessed using +#' this package, with a brief description. #' -#' @return A [`tibble::tibble`]. +#' @return A [`tibble::tibble`] of endpoints, with two columns: +#' \item{Endpoint}{Name of the function for accessing this API endpoint.} +#' \item{Description}{One-sentence description of the data available at the +#' endpoint.} #' @export #' @importFrom utils help.search #' @@ -20,5 +22,6 @@ avail_endpoints <- function() { Endpoint = paste0(h$Name, "()"), Description = h$Title ) + cli::cli_inform(c("i" = "Data is available for the US only, unless otherwise specified")) tib %>% print(n = 50) } diff --git a/R/cache.R b/R/cache.R index dda3d15f..bc30b48f 100644 --- a/R/cache.R +++ b/R/cache.R @@ -34,7 +34,7 @@ cache_environ$epidatr_cache <- NULL #' specify either `issues` before a certain date, or `as_of` before a certain #' date will actually cache. For example the call #' ``` -#' covidcast( +#' pub_covidcast( #' source = "jhu-csse", #' signals = "confirmed_7dav_incidence_prop", #' geo_type = "state", @@ -46,7 +46,7 @@ cache_environ$epidatr_cache <- NULL #' *won't* cache, since it is possible for the cache to be invalidated by new #' releases with no warning. On the other hand, the call #' ``` -#' covidcast( +#' pub_covidcast( #' source = "jhu-csse", #' signals = "confirmed_7dav_incidence_prop", #' geo_type = "state", @@ -76,9 +76,9 @@ cache_environ$epidatr_cache <- NULL #' ) #' #' @param cache_dir the directory in which the cache is stored. By default, this -#' is `tools::R_user_dir()` if on R 4.0+, but must be specified for earlier -#' versions of R. The path can be either relative or absolute. The -#' environmental variable is `EPIDATR_CACHE_DIR`. +#' is `rappdirs::user_cache_dir("R", version = "epidatr")`. The path can be +#' either relative or absolute. The environmental variable is +#' `EPIDATR_CACHE_DIR`. #' @param days the maximum length of time in days to keep any particular cached #' call. By default this is `1`. The environmental variable is #' `EPIDATR_CACHE_MAX_AGE_DAYS`. @@ -90,6 +90,8 @@ cache_environ$epidatr_cache <- NULL #' variable is `EPIDATR_CACHE_LOGFILE`. #' @param confirm whether to confirm directory creation. default is `TRUE`; #' should only be set in non-interactive scripts +#' @param startup indicates whether the function is being called on +#' startup. Affects suppressability of the messages. Default is `FALSE`. #' @return [`NULL`] no return value, all effects are stored in the package #' environment #' @seealso [`clear_cache`] to delete the old cache while making a new one, @@ -102,9 +104,10 @@ set_cache <- function(cache_dir = NULL, days = NULL, max_size = NULL, logfile = NULL, - confirm = TRUE) { - if (is.null(cache_dir) && sessionInfo()$R.version$major >= 4) { - cache_dir <- Sys.getenv("EPIDATR_CACHE_DIR", unset = tools::R_user_dir("epidatr")) + confirm = TRUE, + startup = FALSE) { + if (is.null(cache_dir)) { + cache_dir <- Sys.getenv("EPIDATR_CACHE_DIR", unset = rappdirs::user_cache_dir("R", version = "epidatr")) } else if (is.null(cache_dir)) { # earlier version, so no tools cache_dir <- Sys.getenv("EPIDATR_CACHE_DIR") @@ -154,7 +157,6 @@ set_cache <- function(cache_dir = NULL, } } - if (!cache_usable) { print(glue::glue( "The directory at {cache_dir} is not accessible; check permissions and/or use a different ", @@ -163,11 +165,19 @@ set_cache <- function(cache_dir = NULL, } else if (cache_exists) { cache_environ$epidatr_cache <- cachem::cache_disk( dir = cache_dir, - max_size = as.integer(max_size * 1024^2), + max_size = max_size * 1024^2, max_age = days * 24 * 60 * 60, logfile = file.path(cache_dir, logfile) ) } + + cli::cli_inform(c( + "!" = "epidatr cache is being used (set env var EPIDATR_USE_CACHE=FALSE if not intended).", + "i" = "The cache directory is {cache_dir}.", + "i" = "The cache will be cleared after {days} day{ifelse(days>1,'s','')} + and will be pruned if it exceeds {max_size} MB.", + "i" = "The log of cache transactions is stored at {file.path(cache_dir, logfile)}." + ), class = if (startup) "packageStartupMessage" else NULL) } #' Manually reset the cache, deleting all currently saved data and starting afresh @@ -185,7 +195,7 @@ set_cache <- function(cache_dir = NULL, #' [`disable_cache`] to only disable without deleting, and [`cache_info`] #' @export #' @import cachem -clear_cache <- function(disable = FALSE, ...) { +clear_cache <- function(..., disable = FALSE) { if (any(!is.na(cache_environ$epidatr_cache))) { cache_environ$epidatr_cache$destroy() } @@ -252,12 +262,12 @@ cache_epidata_call <- function(epidata_call, fetch_args = fetch_args_list()) { if (as_of_recent || issues_recent) { cli::cli_warn( c( - "using cached results with `as_of` within the past week (or the future!).", - "This will likely result in an invalid cache. Consider\n", - "1. disabling the cache for this session with `disable_cache` or permanently with environmental ", - "variable `EPIDATR_USE_CACHE=FALSE`\n", - "2. setting `EPIDATR_CACHE_MAX_AGE_DAYS={Sys.getenv('EPIDATR_CACHE_MAX_AGE_DAYS', unset = 1)}`", - " to e.g. `3/24` (3 hours)." + "Using cached results with `as_of` within the past week (or the future!). + This will likely result in an invalid cache. Consider", + "i" = "disabling the cache for this session with `disable_cache` or + permanently with environmental variable `EPIDATR_USE_CACHE=FALSE`", + "i" = "setting `EPIDATR_CACHE_MAX_AGE_DAYS={Sys.getenv('EPIDATR_CACHE_MAX_AGE_DAYS + ', unset = 1)}` to e.g. `3/24` (3 hours)." ), .frequency = "regularly", .frequency_id = "cache timing issues", @@ -267,8 +277,8 @@ cache_epidata_call <- function(epidata_call, fetch_args = fetch_args_list()) { if (!is.key_missing(cached)) { cli::cli_warn( c( - "loading from the cache at {cache_environ$epidatr_cache$info()$dir}; ", - "see {cache_environ$epidatr_cache$info()$logfile} for more details." + "Loading from the cache at {cache_environ$epidatr_cache$info()$dir}; + see {cache_environ$epidatr_cache$info()$logfile} for more details." ), .frequency = "regularly", .frequency_id = "using the cache", @@ -277,7 +287,6 @@ cache_epidata_call <- function(epidata_call, fetch_args = fetch_args_list()) { return(cached[[1]]) } } - 'which was saved on {format(cached[[2]],"%A %B %d, %Y")}, which took {round(cached[[3]][[3]], digits=5)} seconds.' # need to actually get the data, since its either not in the cache or we're not caching runtime <- system.time(if (epidata_call$only_supports_classic) { fetched <- fetch_classic(epidata_call, fetch_args) diff --git a/R/constants.R b/R/constants.R index b00768ca..2a4aa3d7 100644 --- a/R/constants.R +++ b/R/constants.R @@ -1,3 +1,3 @@ -version <- "1.0.0" +version <- "1.0.0.9000" http_headers <- httr::add_headers("User-Agent" = paste0("epidatr/", version), "Accept-Encoding" = "gzip") global_base_url <- "https://api.delphi.cmu.edu/epidata/" diff --git a/R/covidcast.R b/R/covidcast.R index 66263be1..32868499 100644 --- a/R/covidcast.R +++ b/R/covidcast.R @@ -127,7 +127,7 @@ print.covidcast_data_source <- function(x, ...) { #' ``` #' #' These objects can be used directly to fetch data, without requiring us to use -#' the `covidcast()` function. Simply use the `$call` attribute of the object: +#' the `pub_covidcast()` function. Simply use the `$call` attribute of the object: #' #' ```{r} #' epidata$signals$`fb-survey:smoothed_cli`$call("state", "pa", diff --git a/R/endpoints.R b/R/endpoints.R index da14c2bb..0146ca64 100644 --- a/R/endpoints.R +++ b/R/endpoints.R @@ -1,4 +1,4 @@ -#' CDC page hits +#' CDC total and by topic webpage visits #' #' @description #' API docs: @@ -14,14 +14,20 @@ #' #' @param auth string. Restricted access key (not the same as API key). #' @param locations character. Locations to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' See `fetch_args_list()` for details. #' @return [`tibble::tibble`] #' #' @keywords endpoint #' @export -pvt_cdc <- function(auth, locations, epiweeks, fetch_args = fetch_args_list()) { +pvt_cdc <- function( + auth, + locations, + epiweeks = "*", + fetch_args = fetch_args_list()) { + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("auth", auth, len = 1) assert_character_param("locations", locations) assert_timeset_param("epiweeks", epiweeks) @@ -51,7 +57,7 @@ pvt_cdc <- function(auth, locations, epiweeks, fetch_args = fetch_args_list()) { ) %>% fetch(fetch_args = fetch_args) } -#' COVID hospitalization facility identifiers +#' Helper for finding COVID hospitalization facilities #' #' @description #' API docs: @@ -89,6 +95,8 @@ pub_covid_hosp_facility_lookup <- function( zip = NULL, fips_code = NULL, fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + assert_character_param("state", state, len = 1, required = FALSE) assert_character_param("ccn", ccn, len = 1, required = FALSE) assert_character_param("city", city, len = 1, required = FALSE) @@ -133,7 +141,7 @@ pub_covid_hosp_facility_lookup <- function( ) %>% fetch(fetch_args = fetch_args) } -#' COVID hospitalization data for specific facilities +#' COVID hospitalizations by facility #' #' @description #' API docs: @@ -153,30 +161,62 @@ pub_covid_hosp_facility_lookup <- function( #' hospital_pks = "100075", #' collection_weeks = epirange(20200101, 20200501) #' ) +#' +#' pub_covid_hosp_facility( +#' hospital_pks = "100075", +#' collection_weeks = epirange(202001, 202005) +#' ) #' } #' @param hospital_pks character. Facility identifiers. -#' @param collection_weeks [`timeset`]. Epiweeks to fetch. +#' @param collection_weeks [`timeset`]. Dates (corresponding to epiweeks) to +#' fetch. Defaults to all ("*") dates. #' @param ... not used for values, forces later arguments to bind by name #' @param publication_dates [`timeset`]. Publication dates to fetch. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`tibble::tibble`] #' +#' @importFrom checkmate test_class test_integerish test_character +#' #' @seealso [`pub_covid_hosp_facility()`], [`epirange()`] #' @keywords endpoint #' @export # pub_covid_hosp_facility <- function( hospital_pks, - collection_weeks, + collection_weeks = "*", ..., publication_dates = NULL, fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + + collection_weeks <- get_wildcard_equivalent_dates(collection_weeks, "day") + assert_character_param("hospital_pks", hospital_pks) assert_timeset_param("collection_weeks", collection_weeks) assert_timeset_param("publication_dates", publication_dates, required = FALSE) collection_weeks <- parse_timeset_input(collection_weeks) publication_dates <- parse_timeset_input(publication_dates) + # Confusingly, the endpoint expects `collection_weeks` to be in day format, + # but correspond to epiweeks. Allow `collection_weeks` to be provided in + # either day or week format. + coercion_msg <- c( + "`collection_weeks` is in week format but `pub_covid_hosp_facility` + expects day format; dates will be converted to day format but may not + correspond exactly to desired time range" + ) + if (test_class(collection_weeks, "EpiRange") && nchar(collection_weeks$from) == 6) { + cli::cli_warn(coercion_msg, class = "epidatr__epirange_week_coercion") + collection_weeks <- reformat_epirange(collection_weeks, to_type = "day") + # Single week date. + } else if ( + (test_integerish(collection_weeks) || test_character(collection_weeks)) && + nchar(collection_weeks) == 6 + ) { + cli::cli_warn(coercion_msg, class = "epidatr__single_week_coercion") + collection_weeks <- parse_api_week(collection_weeks) + } + create_epidata_call( "covid_hosp_facility/", list( @@ -428,12 +468,70 @@ pub_covid_hosp_facility <- function( create_epidata_field_info( "total_patients_hosp_confirmed_influenza_and_covid_7d_avg", "float" + ), + create_epidata_field_info("geocoded_hospital_address", "text"), + create_epidata_field_info("hhs_ids", "text"), + create_epidata_field_info("is_corrected", "bool"), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_7_day_coverage", + "int" + ), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_7_day_coverage", + "int" + ), + create_epidata_field_info( + "previous_day_admission_pediatric_covid_confirmed_7_day_coverage", + "int" + ), + create_epidata_field_info( + "previous_day_admission_pediatric_covid_suspected_7_day_coverage", + "int" + ), + create_epidata_field_info( + "previous_week_patients_covid_vaccinated_doses_all_7_day", + "int" + ), + create_epidata_field_info( + "previous_week_patients_covid_vaccinated_doses_all_7_day_sum", + "int" + ), + create_epidata_field_info( + "previous_week_patients_covid_vaccinated_doses_one_7_day", + "int" + ), + create_epidata_field_info( + "previous_week_patients_covid_vaccinated_doses_one_7_day_sum", + "int" + ), + create_epidata_field_info( + "previous_week_personnel_covid_vaccd_doses_administered_7_day", + "int" + ), + create_epidata_field_info( + "previous_week_personnel_covid_vaccd_doses_administered_7_day_sum", + "int" + ), + create_epidata_field_info("total_personnel_covid_vaccinated_doses_all_7_day", "int"), + create_epidata_field_info( + "total_personnel_covid_vaccinated_doses_all_7_day_sum", + "int" + ), + create_epidata_field_info("total_personnel_covid_vaccinated_doses_none_7_day", "int"), + create_epidata_field_info( + "total_personnel_covid_vaccinated_doses_none_7_day_sum", + "int" + ), + create_epidata_field_info("total_personnel_covid_vaccinated_doses_one_7_day", "int"), + create_epidata_field_info( + "total_personnel_covid_vaccinated_doses_one_7_day_sum", + "int" ) ) ) %>% fetch(fetch_args = fetch_args) } -#' COVID Hospitalization Data by State +#' COVID hospitalizations by state #' #' @description #' API docs: . @@ -454,35 +552,63 @@ pub_covid_hosp_facility <- function( #' } #' #' @param states character. Two letter state abbreviations. -#' @param dates [`timeset`]. Dates to fetch. -#' @param issues [`timeset`]. Optionally, the issues to fetch. If not set, the -#' most recent issue is returned. +#' @param dates [`timeset`]. Dates to fetch. Defaults to all ("*") dates. #' @param ... not used for values, forces later arguments to bind by name +#' @param as_of Date. Optionally, the as of date for the issues to fetch. If not +#' specified, the most recent data is returned. Mutually exclusive with +#' `issues`. +#' @param issues [`timeset`]. Optionally, the issue of the data to fetch. If not +#' specified, the most recent issue is returned. Mutually exclusive with +#' `as_of` or `lag`. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`tibble::tibble`] #' #' @keywords endpoint #' @export # -pub_covid_hosp_state_timeseries <- function(states, dates, ..., issues = NULL, fetch_args = fetch_args_list()) { +pub_covid_hosp_state_timeseries <- function( + states, + dates = "*", + ..., + as_of = NULL, + issues = NULL, + fetch_args = fetch_args_list()) { + # Check parameters + rlang::check_dots_empty() + + if (missing(states) || missing(dates)) { + stop( + "`states` and `dates` are both required" + ) + } + + if (sum(!is.null(issues), !is.null(as_of)) > 1) { + stop("`issues`and `as_of` are mutually exclusive") + } + + dates <- get_wildcard_equivalent_dates(dates, "day") + assert_character_param("states", states) assert_timeset_param("dates", dates) + assert_date_param("as_of", as_of, len = 1, required = FALSE) assert_timeset_param("issues", issues, required = FALSE) + dates <- parse_timeset_input(dates) issues <- parse_timeset_input(issues) + as_of <- parse_timeset_input(as_of) create_epidata_call( "covid_hosp_state_timeseries/", list( states = states, dates = dates, - issues = issues + issues = issues, + as_of = as_of ), list( create_epidata_field_info("state", "text"), create_epidata_field_info("issue", "date"), create_epidata_field_info("date", "date"), - create_epidata_field_info("issue", "date"), create_epidata_field_info("critical_staffing_shortage_today_yes", "bool"), create_epidata_field_info("critical_staffing_shortage_today_no", "bool"), create_epidata_field_info("critical_staffing_shortage_today_not_reported", "bool"), @@ -588,7 +714,157 @@ pub_covid_hosp_state_timeseries <- function(states, dates, ..., issues = NULL, f create_epidata_field_info("percent_of_inpatients_with_covid", "float"), create_epidata_field_info("inpatient_bed_covid_utilization", "float"), create_epidata_field_info("adult_icu_bed_covid_utilization", "float"), - create_epidata_field_info("adult_icu_bed_utilization", "float") + create_epidata_field_info("adult_icu_bed_utilization", "float"), + create_epidata_field_info("geocoded_state", "text"), + create_epidata_field_info("deaths_covid", "int"), + create_epidata_field_info("deaths_covid_coverage", "int"), + create_epidata_field_info("icu_patients_confirmed_influenza", "int"), + create_epidata_field_info("icu_patients_confirmed_influenza_coverage", "int"), + create_epidata_field_info( + "on_hand_supply_therapeutic_a_casirivimab_imdevimab_courses", + "int" + ), + create_epidata_field_info("on_hand_supply_therapeutic_b_bamlanivimab_courses", "int"), + create_epidata_field_info( + "on_hand_supply_therapeutic_c_bamlanivimab_etesevimab_courses", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_confirmed_18_19", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_18_19_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_confirmed_20_29", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_20_29_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_confirmed_30_39", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_30_39_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_confirmed_40_49", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_40_49_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_confirmed_50_59", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_50_59_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_confirmed_60_69", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_60_69_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_confirmed_70_79", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_70_79_coverage", + "int" + ), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_80plus", + "int" + ), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_80plus_coverage", + "int" + ), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_unknown", + "int" + ), + create_epidata_field_info( + "previous_day_admission_adult_covid_confirmed_unknown_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_suspected_18_19", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_18_19_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_suspected_20_29", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_20_29_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_suspected_30_39", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_30_39_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_suspected_40_49", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_40_49_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_suspected_50_59", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_50_59_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_suspected_60_69", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_60_69_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_adult_covid_suspected_70_79", "int"), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_70_79_coverage", + "int" + ), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_80plus", + "int" + ), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_80plus_coverage", + "int" + ), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_unknown", + "int" + ), + create_epidata_field_info( + "previous_day_admission_adult_covid_suspected_unknown_coverage", + "int" + ), + create_epidata_field_info("previous_day_admission_influenza_confirmed", "int"), + create_epidata_field_info( + "previous_day_admission_influenza_confirmed_coverage", + "int" + ), + create_epidata_field_info("previous_day_deaths_covid_and_influenza", "int"), + create_epidata_field_info("previous_day_deaths_covid_and_influenza_coverage", "int"), + create_epidata_field_info("previous_day_deaths_influenza", "int"), + create_epidata_field_info("previous_day_deaths_influenza_coverage", "int"), + create_epidata_field_info( + "previous_week_therapeutic_a_casirivimab_imdevimab_courses_used", + "int" + ), + create_epidata_field_info( + "previous_week_therapeutic_b_bamlanivimab_courses_used", + "int" + ), + create_epidata_field_info( + "previous_week_therapeutic_c_bamlanivimab_etesevimab_courses_used", + "int" + ), + create_epidata_field_info( + "total_patients_hospitalized_confirmed_influenza_covid", + "int" + ), + create_epidata_field_info( + "total_patients_hospitalized_confirmed_influenza_covid_coverage", + "int" + ), + create_epidata_field_info("total_patients_hospitalized_confirmed_influenza", "int"), + create_epidata_field_info( + "total_patients_hospitalized_confirmed_influenza_coverage", + "int" + ) ) ) %>% fetch(fetch_args = fetch_args) } @@ -626,6 +902,11 @@ pub_covidcast_meta <- function(fetch_args = fetch_args_list()) { categories = c("week", "day") ), + create_epidata_field_info( + "geo_type", + "categorical", + categories = c("nation", "msa", "hrr", "hhs", "state", "county", "dma") + ), create_epidata_field_info("min_time", "date"), create_epidata_field_info("max_time", "date"), create_epidata_field_info("num_locations", "int"), @@ -641,7 +922,7 @@ pub_covidcast_meta <- function(fetch_args = fetch_args_list()) { ) %>% fetch(fetch_args = fetch_args) } -#' COVID data via the covidcast endpoint +#' Various COVID and flu signals via the COVIDcast endpoint #' #' @description #' API docs: @@ -682,7 +963,7 @@ pub_covidcast_meta <- function(fetch_args = fetch_args_list()) { #' @param geo_values character. The geographies to return. "*" fetches #' all. (See: #' .) -#' @param time_values [`timeset`]. Dates to fetch. +#' @param time_values [`timeset`]. Dates to fetch. Defaults to all ("*") dates. #' @param ... not used for values, forces later arguments to bind by name #' @param as_of Date. Optionally, the as of date for the issues to fetch. If not #' specified, the most recent data is returned. Mutually exclusive with @@ -704,23 +985,26 @@ pub_covidcast <- function( signals, geo_type, time_type, - geo_values, - time_values, + geo_values = "*", + time_values = "*", ..., as_of = NULL, issues = NULL, lag = NULL, fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + # Check parameters if ( missing(source) || missing(signals) || missing(time_type) || missing(geo_type) || - missing(time_values) || missing(geo_values) + missing(time_values) || + missing(geo_values) ) { stop( - "`source`, `signals`, `time_type`, `geo_type`, `time_values`, and `geo_value` are all required" + "`source`, `signals`, `time_type`, `geo_type`, `time_values`, and `geo_values` are all required" ) } @@ -781,7 +1065,7 @@ pub_covidcast <- function( ) %>% fetch(fetch_args = fetch_args) } -#' Delphi's ILINet forecasts +#' Delphi's ILINet outpatient doctor visits forecasts #' @description #' API docs: #' @@ -790,12 +1074,16 @@ pub_covidcast <- function( #' pub_delphi(system = "ec", epiweek = 201501) #' } #' @param system character. System name to fetch. -#' @param epiweek [`timeset`]. Epiweeks to fetch. +#' @param epiweek [`timeset`]. Epiweek to fetch. Does not support multiple dates. +#' Make separate calls to fetch data for multiple epiweeks. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`list`] #' @keywords endpoint #' @export -pub_delphi <- function(system, epiweek, fetch_args = fetch_args_list()) { +pub_delphi <- function( + system, + epiweek, + fetch_args = fetch_args_list()) { assert_character_param("system", system) assert_timeset_param("epiweek", epiweek, len = 1) epiweek <- parse_timeset_input(epiweek) @@ -812,7 +1100,7 @@ pub_delphi <- function(system, epiweek, fetch_args = fetch_args_list()) { ) %>% fetch(fetch_args = fetch_args) } -#' Delphi's PAHO Dengue nowcast +#' Delphi's PAHO dengue nowcasts (North and South America) #' @description #' API docs: #' @@ -824,12 +1112,17 @@ pub_delphi <- function(system, epiweek, fetch_args = fetch_args_list()) { #' ) #' } #' @param locations character. Locations to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pub_dengue_nowcast <- function(locations, epiweeks, fetch_args = fetch_args_list()) { +pub_dengue_nowcast <- function( + locations, + epiweeks = "*", + fetch_args = fetch_args_list()) { + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("locations", locations) assert_timeset_param("epiweeks", epiweeks) epiweeks <- parse_timeset_input(epiweeks) @@ -846,7 +1139,7 @@ pub_dengue_nowcast <- function(locations, epiweeks, fetch_args = fetch_args_list ) %>% fetch(fetch_args = fetch_args) } -#' Dengue digital surveillance sensors in PAHO member countries +#' PAHO dengue digital surveillance sensors (North and South America) #' @description #' API docs: #' @@ -862,12 +1155,19 @@ pub_dengue_nowcast <- function(locations, epiweeks, fetch_args = fetch_args_list #' @param auth string. Restricted access key (not the same as API key). #' @param names character. Names to fetch. #' @param locations character. Locations to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pvt_dengue_sensors <- function(auth, names, locations, epiweeks, fetch_args = fetch_args_list()) { +pvt_dengue_sensors <- function( + auth, + names, + locations, + epiweeks = "*", + fetch_args = fetch_args_list()) { + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("auth", auth, len = 1) assert_character_param("names", names) assert_character_param("locations", locations) @@ -891,7 +1191,7 @@ pvt_dengue_sensors <- function(auth, names, locations, epiweeks, fetch_args = fe ) %>% fetch(fetch_args = fetch_args) } -#' ECDC ILI data +#' ECDC ILI incidence (Europe) #' @description #' API docs: . #' @@ -907,7 +1207,7 @@ pvt_dengue_sensors <- function(auth, names, locations, epiweeks, fetch_args = fe #' pub_ecdc_ili(regions = "austria", epiweeks = epirange(201901, 202001)) #' } #' @param regions character. Regions to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param ... not used for values, forces later arguments to bind by name #' @param issues [`timeset`]. Optionally, the issues to fetch. If not set, the #' most recent issue is returned. Mutually exclusive with `lag`. @@ -917,7 +1217,17 @@ pvt_dengue_sensors <- function(auth, names, locations, epiweeks, fetch_args = fe #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pub_ecdc_ili <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetch_args = fetch_args_list()) { +pub_ecdc_ili <- function( + regions, + epiweeks = "*", + ..., + issues = NULL, + lag = NULL, + fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("regions", regions) assert_timeset_param("epiweeks", epiweeks) assert_timeset_param("issues", issues, required = FALSE) @@ -947,11 +1257,11 @@ pub_ecdc_ili <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetc ) %>% fetch(fetch_args = fetch_args) } -#' FluSurv hospitalization data +#' CDC FluSurv flu hospitalizations #' @description #' API docs: . #' -#' Obtain information on flu hospitalization rates from the Center of Disease +#' Obtain information on influenza hospitalization rates from the Center of Disease #' Control. #' #' See also . @@ -964,7 +1274,7 @@ pub_ecdc_ili <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetc #' pub_flusurv(locations = "CA", epiweeks = epirange(201701, 201801)) #' } #' @param locations character. Character vector indicating location. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param ... not used for values, forces later arguments to bind by name #' @param issues [`timeset`]. Optionally, the issues to fetch. If not set, the #' most recent issue is returned. Mutually exclusive with `lag`. @@ -974,7 +1284,17 @@ pub_ecdc_ili <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetc #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pub_flusurv <- function(locations, epiweeks, ..., issues = NULL, lag = NULL, fetch_args = fetch_args_list()) { +pub_flusurv <- function( + locations, + epiweeks = "*", + ..., + issues = NULL, + lag = NULL, + fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("locations", locations) assert_timeset_param("epiweeks", epiweeks) assert_timeset_param("issues", issues, required = FALSE) @@ -994,7 +1314,7 @@ pub_flusurv <- function(locations, epiweeks, ..., issues = NULL, lag = NULL, fet lag = lag ), list( - create_epidata_field_info("release_date", "text"), + create_epidata_field_info("release_date", "date"), create_epidata_field_info("location", "text"), create_epidata_field_info("issue", "epiweek"), create_epidata_field_info("epiweek", "epiweek"), @@ -1009,7 +1329,7 @@ pub_flusurv <- function(locations, epiweeks, ..., issues = NULL, lag = NULL, fet ) %>% fetch(fetch_args = fetch_args) } -#' FluView virological data from clinical labs +#' CDC FluView flu tests from clinical labs #' @description #' API docs: #' @@ -1020,7 +1340,7 @@ pub_flusurv <- function(locations, epiweeks, ..., issues = NULL, lag = NULL, fet #' @param regions character. Regions to fetch. #' @param epiweeks [`timeset`]. Epiweeks to fetch in the form #' epirange(startweek,endweek), where startweek and endweek are of the form -#' YYYYWW (string or numeric). +#' YYYYWW (string or numeric). Defaults to all ("*") dates. #' @param ... not used for values, forces later arguments to bind by name #' @param issues [`timeset`]. Optionally, the issues to fetch. If not set, the #' most recent issue is returned. Mutually exclusive with `lag`. @@ -1030,7 +1350,17 @@ pub_flusurv <- function(locations, epiweeks, ..., issues = NULL, lag = NULL, fet #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pub_fluview_clinical <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetch_args = fetch_args_list()) { +pub_fluview_clinical <- function( + regions, + epiweeks = "*", + ..., + issues = NULL, + lag = NULL, + fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("regions", regions) assert_timeset_param("epiweeks", epiweeks) assert_timeset_param("issues", issues, required = FALSE) @@ -1050,7 +1380,7 @@ pub_fluview_clinical <- function(regions, epiweeks, ..., issues = NULL, lag = NU lag = lag ), list( - create_epidata_field_info("release_date", "text"), + create_epidata_field_info("release_date", "date"), create_epidata_field_info("region", "text"), create_epidata_field_info("issue", "epiweek"), create_epidata_field_info("epiweek", "epiweek"), @@ -1065,10 +1395,10 @@ pub_fluview_clinical <- function(regions, epiweeks, ..., issues = NULL, lag = NU ) %>% fetch(fetch_args = fetch_args) } -#' FluView metadata +#' Metadata for the FluView endpoint #' @description #' API docs: -#' Returns information about the fluview endpoint. +#' #' @examples #' \dontrun{ #' pub_fluview_meta() @@ -1077,6 +1407,7 @@ pub_fluview_clinical <- function(regions, epiweeks, ..., issues = NULL, lag = NU #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' #' @return [`tibble::tibble`] +#' @seealso [`pub_fluview()`] #' @keywords endpoint #' @export pub_fluview_meta <- function(fetch_args = fetch_args_list()) { @@ -1084,15 +1415,15 @@ pub_fluview_meta <- function(fetch_args = fetch_args_list()) { "fluview_meta/", list(), list( - create_epidata_field_info("latest_update", "text"), - create_epidata_field_info("latest_issue", "date"), + create_epidata_field_info("latest_update", "date"), + create_epidata_field_info("latest_issue", "epiweek"), create_epidata_field_info("table_rows", "int") ) - ) + ) %>% fetch(fetch_args = fetch_args) } -#' FluView ILINet data +#' CDC FluView ILINet outpatient doctor visits #' @description #' API docs: . For #' @@ -1114,7 +1445,7 @@ pub_fluview_meta <- function(fetch_args = fetch_args_list()) { #' on. Full list link below. #' @param epiweeks [`timeset`]. Epiweeks to fetch in the form #' `epirange(startweek, endweek)`, where startweek and endweek are of the form -#' YYYYWW (string or numeric). +#' YYYYWW (string or numeric). Defaults to all ("*") dates. #' @param ... not used for values, forces later arguments to bind by name #' @param issues [`timeset`]. Optionally, the issues to fetch. If not set, the #' most recent issue is returned. Mutually exclusive with `lag`. @@ -1128,12 +1459,16 @@ pub_fluview_meta <- function(fetch_args = fetch_args_list()) { #' @export pub_fluview <- function( regions, - epiweeks, + epiweeks = "*", ..., issues = NULL, lag = NULL, auth = NULL, fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("regions", regions) assert_timeset_param("epiweeks", epiweeks) assert_timeset_param("issues", issues, required = FALSE) @@ -1156,13 +1491,14 @@ pub_fluview <- function( auth = auth ), list( - create_epidata_field_info("release_date", "text"), + create_epidata_field_info("release_date", "date"), create_epidata_field_info("region", "text"), create_epidata_field_info("issue", "epiweek"), create_epidata_field_info("epiweek", "epiweek"), create_epidata_field_info("lag", "int"), create_epidata_field_info("num_ili", "int"), create_epidata_field_info("num_patients", "int"), + create_epidata_field_info("num_providers", "int"), create_epidata_field_info("num_age_0", "int"), create_epidata_field_info("num_age_1", "int"), create_epidata_field_info("num_age_2", "int"), @@ -1175,7 +1511,7 @@ pub_fluview <- function( ) %>% fetch(fetch_args = fetch_args) } -#' Google Flu Trends data +#' Google Flu Trends flu search volume #' @description #' API docs: #' @@ -1195,13 +1531,18 @@ pub_fluview <- function( #' pub_gft(locations = "hhs1", epiweeks = epirange(201201, 202001)) #' } #' @param locations character. Locations to fetch. -#' @param epiweeks [`timeset`] Epiweeks to fetch. +#' @param epiweeks [`timeset`] Epiweeks to fetch. Defaults to all ("*") dates. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pub_gft <- function(locations, epiweeks, fetch_args = fetch_args_list()) { +pub_gft <- function( + locations, + epiweeks = "*", + fetch_args = fetch_args_list()) { + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("locations", locations) assert_timeset_param("epiweeks", epiweeks) epiweeks <- parse_timeset_input(epiweeks) @@ -1217,7 +1558,7 @@ pub_gft <- function(locations, epiweeks, fetch_args = fetch_args_list()) { ) %>% fetch(fetch_args = fetch_args) } -#' Google Health Trends data +#' Google Health Trends health topics search volume #' #' @description #' API docs: @@ -1235,13 +1576,20 @@ pub_gft <- function(locations, epiweeks, fetch_args = fetch_args_list()) { #' } #' @param auth string. Restricted access key (not the same as API key). #' @param locations character. Locations to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param query string. The query to be fetched. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pvt_ght <- function(auth, locations, epiweeks, query, fetch_args = fetch_args_list()) { +pvt_ght <- function( + auth, + locations, + epiweeks = "*", + query, + fetch_args = fetch_args_list()) { + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("auth", auth, len = 1) assert_character_param("locations", locations) assert_timeset_param("epiweeks", epiweeks) @@ -1264,7 +1612,7 @@ pvt_ght <- function(auth, locations, epiweeks, query, fetch_args = fetch_args_li ) %>% fetch(fetch_args = fetch_args) } -#' KCDC ILI data +#' KCDC ILI incidence (Korea) #' @description #' API docs: #' @@ -1273,7 +1621,7 @@ pvt_ght <- function(auth, locations, epiweeks, query, fetch_args = fetch_args_li #' pub_kcdc_ili(regions = "ROK", epiweeks = 200436) #' } #' @param regions character. Regions to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param ... not used for values, forces later arguments to bind by name #' @param issues [`timeset`]. Optionally, the issues to fetch. If not set, the #' most recent issue is returned. Mutually exclusive with `lag`. @@ -1283,7 +1631,17 @@ pvt_ght <- function(auth, locations, epiweeks, query, fetch_args = fetch_args_li #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pub_kcdc_ili <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetch_args = fetch_args_list()) { +pub_kcdc_ili <- function( + regions, + epiweeks = "*", + ..., + issues = NULL, + lag = NULL, + fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("regions", regions) assert_timeset_param("epiweeks", epiweeks) assert_timeset_param("issues", issues, required = FALSE) @@ -1303,7 +1661,7 @@ pub_kcdc_ili <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetc lag = lag ), list( - create_epidata_field_info("release_date", "text"), + create_epidata_field_info("release_date", "date"), create_epidata_field_info("region", "text"), create_epidata_field_info("issue", "epiweek"), create_epidata_field_info("epiweek", "epiweek"), @@ -1313,7 +1671,7 @@ pub_kcdc_ili <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetc ) %>% fetch(fetch_args = fetch_args) } -#' NoroSTAT metadata +#' Metadata for the NoroSTAT endpoint #' @description #' API docs: #' @@ -1324,6 +1682,7 @@ pub_kcdc_ili <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetc #' @param auth string. Restricted access key (not the same as API key). #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`list`] +#' @seealso [`pvt_norostat()`] #' @keywords endpoint #' @export pvt_meta_norostat <- function(auth, fetch_args = fetch_args_list()) { @@ -1336,7 +1695,7 @@ pvt_meta_norostat <- function(auth, fetch_args = fetch_args_list()) { ) %>% fetch(fetch_args = fetch_args) } -#' API metadata +#' Metadata for the Delphi Epidata API #' @description #' API docs: #' @@ -1349,7 +1708,7 @@ pub_meta <- function(fetch_args = fetch_args_list()) { create_epidata_call("meta/", list(), only_supports_classic = TRUE) %>% fetch(fetch_args = fetch_args) } -#' NIDSS dengue data +#' NIDSS dengue cases (Taiwan) #' @description #' API docs: #' @@ -1367,13 +1726,18 @@ pub_meta <- function(fetch_args = fetch_args_list()) { #' pub_nidss_dengue(locations = "taipei", epiweeks = epirange(201201, 201301)) #' } #' @param locations character. Locations to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pub_nidss_dengue <- function(locations, epiweeks, fetch_args = fetch_args_list()) { +pub_nidss_dengue <- function( + locations, + epiweeks = "*", + fetch_args = fetch_args_list()) { + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("locations", locations) assert_timeset_param("epiweeks", epiweeks) epiweeks <- parse_timeset_input(epiweeks) @@ -1389,7 +1753,7 @@ pub_nidss_dengue <- function(locations, epiweeks, fetch_args = fetch_args_list() ) %>% fetch(fetch_args = fetch_args) } -#' NIDSS flu data +#' NIDSS flu doctor visits (Taiwan) #' @description #' API docs: #' @@ -1402,7 +1766,7 @@ pub_nidss_dengue <- function(locations, epiweeks, fetch_args = fetch_args_list() #' pub_nidss_flu(regions = "taipei", epiweeks = epirange(201501, 201601)) #' } #' @param regions character. Regions to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param ... not used for values, forces later arguments to bind by name #' @param issues [`timeset`]. Optionally, the issues to fetch. If not set, the #' most recent issue is returned. Mutually exclusive with `lag`. @@ -1412,7 +1776,17 @@ pub_nidss_dengue <- function(locations, epiweeks, fetch_args = fetch_args_list() #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pub_nidss_flu <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetch_args = fetch_args_list()) { +pub_nidss_flu <- function( + regions, + epiweeks = "*", + ..., + issues = NULL, + lag = NULL, + fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("regions", regions) assert_timeset_param("epiweeks", epiweeks) assert_timeset_param("issues", issues, required = FALSE) @@ -1433,7 +1807,7 @@ pub_nidss_flu <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fet lag = lag ), list( - create_epidata_field_info("release_date", "text"), + create_epidata_field_info("release_date", "date"), create_epidata_field_info("region", "text"), create_epidata_field_info("epiweek", "epiweek"), create_epidata_field_info("issue", "epiweek"), @@ -1445,12 +1819,14 @@ pub_nidss_flu <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fet } -#' NoroSTAT data (point data, no min/max) +#' CDC NoroSTAT norovirus outbreaks #' @description +#' This is point data only, and does not include minima or maxima. +#' #' API docs: #' -#' This is the documentation of the API for accessing the NoroSTAT (norostat) -#' endpoint of the Delphi’s epidemiological data. +#' This is the documentation of the API for accessing the NoroSTAT endpoint of +#' the Delphi’s epidemiological data. #' #' @examples #' \dontrun{ @@ -1462,12 +1838,18 @@ pub_nidss_flu <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fet #' } #' @param auth string. Your authentication key. #' @param locations character. Locations to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pvt_norostat <- function(auth, locations, epiweeks, fetch_args = fetch_args_list()) { +pvt_norostat <- function( + auth, + locations, + epiweeks = "*", + fetch_args = fetch_args_list()) { + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("auth", auth, len = 1) assert_character_param("locations", locations, len = 1) assert_timeset_param("epiweeks", epiweeks) @@ -1481,14 +1863,14 @@ pvt_norostat <- function(auth, locations, epiweeks, fetch_args = fetch_args_list epiweeks = epiweeks ), list( - create_epidata_field_info("release_date", "text"), + create_epidata_field_info("release_date", "date"), create_epidata_field_info("epiweek", "epiweek"), create_epidata_field_info("value", "int") ) ) %>% fetch(fetch_args = fetch_args) } -#' Delphi's ILI nowcast +#' Delphi's ILI Nearby nowcasts #' @description #' API docs: . #' @@ -1502,12 +1884,17 @@ pvt_norostat <- function(auth, locations, epiweeks, fetch_args = fetch_args_list #' pub_nowcast(locations = "ca", epiweeks = epirange(201201, 201301)) #' } #' @param locations character. Locations to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pub_nowcast <- function(locations, epiweeks, fetch_args = fetch_args_list()) { +pub_nowcast <- function( + locations, + epiweeks = "*", + fetch_args = fetch_args_list()) { + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("locations", locations) assert_timeset_param("epiweeks", epiweeks) epiweeks <- parse_timeset_input(epiweeks) @@ -1524,7 +1911,7 @@ pub_nowcast <- function(locations, epiweeks, fetch_args = fetch_args_list()) { ) %>% fetch(fetch_args = fetch_args) } -#' PAHO Dengue data +#' PAHO dengue data (North and South America) #' @description #' API docs: #' @@ -1533,7 +1920,7 @@ pub_nowcast <- function(locations, epiweeks, fetch_args = fetch_args_list()) { #' pub_paho_dengue(regions = "ca", epiweeks = epirange(201401, 201501)) #' } #' @param regions character. Regions to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param ... not used for values, forces later arguments to bind by name #' @param issues [`timeset`]. Optionally, the issues to fetch. If not set, the #' most recent issue is returned. Mutually exclusive with `lag`. @@ -1543,7 +1930,17 @@ pub_nowcast <- function(locations, epiweeks, fetch_args = fetch_args_list()) { #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pub_paho_dengue <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, fetch_args = fetch_args_list()) { +pub_paho_dengue <- function( + regions, + epiweeks = "*", + ..., + issues = NULL, + lag = NULL, + fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("regions", regions) assert_timeset_param("epiweeks", epiweeks) assert_timeset_param("issues", issues, required = FALSE) @@ -1560,7 +1957,7 @@ pub_paho_dengue <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, f lag = lag ), list( - create_epidata_field_info("release_date", "text"), + create_epidata_field_info("release_date", "date"), create_epidata_field_info("region", "text"), create_epidata_field_info("serotype", "text"), create_epidata_field_info("epiweek", "epiweek"), @@ -1591,12 +1988,18 @@ pub_paho_dengue <- function(regions, epiweeks, ..., issues = NULL, lag = NULL, f #' } #' @param auth string. Restricted access key (not the same as API key). #' @param locations character. Locations to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pvt_quidel <- function(auth, locations, epiweeks, fetch_args = fetch_args_list()) { +pvt_quidel <- function( + auth, + locations, + epiweeks = "*", + fetch_args = fetch_args_list()) { + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("auth", auth, len = 1) assert_character_param("locations", locations) assert_timeset_param("epiweeks", epiweeks) @@ -1617,12 +2020,12 @@ pvt_quidel <- function(auth, locations, epiweeks, fetch_args = fetch_args_list() ) %>% fetch(fetch_args = fetch_args) } -#' Digital surveillance sensors +#' Influenza and dengue digital surveillance sensors #' @description #' API docs: #' #' This is the documentation of the API for accessing the Digital Surveillance -#' Sensors (sensors) endpoint of the Delphi’s epidemiological Note: this +#' Sensors endpoint of the Delphi’s epidemiological. Note: this #' repository was built to support modeling and forecasting efforts #' surrounding seasonal influenza (and dengue). In the current COVID-19 #' pandemic, syndromic surveillance data, like ILI data (influenza-like @@ -1644,12 +2047,19 @@ pvt_quidel <- function(auth, locations, epiweeks, fetch_args = fetch_args_list() #' @param auth string. Restricted access key (not the same as API key). #' @param names character. Sensor names to fetch. #' @param locations character. Locations to fetch. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. +#' @param epiweeks [`timeset`]. Epiweeks to fetch. Defaults to all ("*") dates. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pvt_sensors <- function(auth, names, locations, epiweeks, fetch_args = fetch_args_list()) { +pvt_sensors <- function( + auth, + names, + locations, + epiweeks = "*", + fetch_args = fetch_args_list()) { + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + assert_character_param("auth", auth, len = 1) assert_character_param("names", names) assert_character_param("locations", locations) @@ -1673,42 +2083,63 @@ pvt_sensors <- function(auth, names, locations, epiweeks, fetch_args = fetch_arg ) %>% fetch(fetch_args = fetch_args) } -#' HealthTweets data +#' HealthTweets total and influenza-related tweets #' @description #' API docs: #' -#' This is the API documentation for accessing the Twitter Stream (twitter) endpoint of Delphi’s epidemiological data. -#' Sourced from [Healthtweets](http://www.healthtweets.org/) +#' This is the API documentation for accessing the Twitter Stream endpoint of +#' Delphi’s epidemiological data. Sourced from +#' [Healthtweets](http://www.healthtweets.org/) #' #' @examples #' \dontrun{ #' pvt_twitter( #' auth = Sys.getenv("SECRET_API_AUTH_TWITTER"), #' locations = "CA", -#' epiweeks = epirange(201501, 202001) +#' time_type = "week", +#' time_values = epirange(201501, 202001) #' ) #' } #' @param auth string. Restricted access key (not the same as API key). #' @param locations character. Locations to fetch. #' @param ... not used for values, forces later arguments to bind by name -#' @param dates [`timeset`]. Dates to fetch. Mutually exclusive with `epiweeks`. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. Mutually exclusive with -#' `dates`. +#' @param time_type string. The temporal resolution of the data (either "day" or +#' "week", depending on signal). +#' @param time_values [`timeset`]. Dates or epiweeks to fetch. Defaults to all +#' ("*") dates. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. #' @return [`tibble::tibble`] #' @keywords endpoint #' @export -pvt_twitter <- function(auth, locations, ..., dates = NULL, epiweeks = NULL, fetch_args = fetch_args_list()) { +pvt_twitter <- function( + auth, + locations, + ..., + time_type = c("day", "week"), + time_values = "*", + fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + + time_type <- match.arg(time_type) + if (time_type == "day") { + dates <- time_values + epiweeks <- NULL + dates <- get_wildcard_equivalent_dates(dates, "day") + } else { + dates <- NULL + epiweeks <- time_values + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + } + assert_character_param("auth", auth, len = 1) assert_character_param("locations", locations) + assert_character_param("time_type", time_type, len = 1) + assert_timeset_param("time_values", time_values) assert_timeset_param("dates", dates, required = FALSE) assert_timeset_param("epiweeks", epiweeks, required = FALSE) dates <- parse_timeset_input(dates) epiweeks <- parse_timeset_input(epiweeks) - if (!xor(is.null(dates), is.null(epiweeks))) { - stop("exactly one of `dates` and `epiweeks` is required") - } time_field <- if (!is.null(dates)) { create_epidata_field_info("date", "date") } else { @@ -1732,7 +2163,7 @@ pvt_twitter <- function(auth, locations, ..., dates = NULL, epiweeks = NULL, fet ) %>% fetch(fetch_args = fetch_args) } -#' Wikipedia access data +#' Wikipedia webpage counts by article #' @description #' API docs: # @@ -1746,13 +2177,18 @@ pvt_twitter <- function(auth, locations, ..., dates = NULL, epiweeks = NULL, fet #' #' @examples #' \dontrun{ -#' pub_wiki(articles = "avian_influenza", epiweeks = epirange(201501, 201601)) +#' pub_wiki( +#' articles = "avian_influenza", +#' time_type = "week", +#' time_values = epirange(201501, 201601) +#' ) #' } #' @param articles character. Articles to fetch. #' @param ... not used for values, forces later arguments to bind by name -#' @param dates [`timeset`]. Dates to fetch. Mutually exclusive with `epiweeks`. -#' @param epiweeks [`timeset`]. Epiweeks to fetch. Mutually exclusive with -#' `dates`. +#' @param time_type string. The temporal resolution of the data (either "day" or +#' "week", depending on signal). +#' @param time_values [`timeset`]. Dates or epiweeks to fetch. Defaults to all +#' ("*") dates. #' @param language string. Language to fetch. #' @param hours integer. Optionally, the hours to fetch. #' @param fetch_args [`fetch_args`]. Additional arguments to pass to `fetch()`. @@ -1762,12 +2198,27 @@ pvt_twitter <- function(auth, locations, ..., dates = NULL, epiweeks = NULL, fet pub_wiki <- function( articles, ..., - dates = NULL, - epiweeks = NULL, + time_type = c("day", "week"), + time_values = "*", hours = NULL, language = "en", fetch_args = fetch_args_list()) { + rlang::check_dots_empty() + + time_type <- match.arg(time_type) + if (time_type == "day") { + dates <- time_values + epiweeks <- NULL + dates <- get_wildcard_equivalent_dates(dates, "day") + } else { + dates <- NULL + epiweeks <- time_values + epiweeks <- get_wildcard_equivalent_dates(epiweeks, "week") + } + assert_character_param("articles", articles) + assert_character_param("time_type", time_type, len = 1) + assert_timeset_param("time_values", time_values) assert_timeset_param("dates", dates, required = FALSE) assert_timeset_param("epiweeks", epiweeks, required = FALSE) assert_integerish_param("hours", hours, required = FALSE) @@ -1775,9 +2226,6 @@ pub_wiki <- function( dates <- parse_timeset_input(dates) epiweeks <- parse_timeset_input(epiweeks) - if (!xor(is.null(dates), is.null(epiweeks))) { - stop("exactly one of `dates` and `epiweeks` is required") - } time_field <- if (!is.null(dates)) { create_epidata_field_info("date", "date") } else { diff --git a/R/epidatacall.R b/R/epidatacall.R index 3e2ad5ba..958e00aa 100644 --- a/R/epidatacall.R +++ b/R/epidatacall.R @@ -6,8 +6,8 @@ #' `epidata_call` objects are generated internally by endpoint functions like #' [`pub_covidcast`]; by default, they are piped directly into the `fetch` #' function to fetch and format the data. For most endpoints this will return -#' a tibble, but a few non-COVIDCAST endpoints only support will return a -#' JSON-like list instead. +#' a tibble, but a few non-COVIDCAST endpoints will return a JSON-like list +#' instead. #' #' @details #' `create_epidata_call` is the constructor for `epidata_call` objects, but you @@ -41,12 +41,38 @@ #' @return #' - For `create_epidata_call`: an `epidata_call` object #' +#' @importFrom purrr map_chr map_lgl create_epidata_call <- function(endpoint, params, meta = NULL, only_supports_classic = FALSE) { stopifnot(is.character(endpoint), length(endpoint) == 1) stopifnot(is.list(params)) stopifnot(is.null(meta) || is.list(meta)) + stopifnot(all(map_lgl(meta, ~ inherits(.x, "EpidataFieldInfo")))) stopifnot(is.logical(only_supports_classic), length(only_supports_classic) == 1) + + if (length(unique(meta)) != length(meta)) { + cli::cli_abort( + c( + "List of expected epidata fields contains duplicate entries", + "i" = "duplicates in meta can cause problems parsing fetched data", + "Please fix in `endpoints.R`" + ), + class = "epidatr__duplicate_meta_entries" + ) + } + + meta_field_names <- map_chr(meta, "name") + if (length(meta_field_names) != length(unique(meta_field_names))) { + cli::cli_abort( + c( + "List of expected epidata fields contains duplicate names", + "i" = "duplicates in meta can cause problems parsing fetched data", + "Please fix in `endpoints.R`" + ), + class = "epidatr__duplicate_meta_names" + ) + } + if (is.null(meta)) { meta <- list() } @@ -63,7 +89,7 @@ create_epidata_call <- function(endpoint, params, meta = NULL, } #' @importFrom checkmate test_class test_list -request_arguments <- function(epidata_call, format_type, fields = NULL) { +request_arguments <- function(epidata_call, format_type, fields) { stopifnot(inherits(epidata_call, "epidata_call")) stopifnot(format_type %in% c("json", "csv", "classic")) stopifnot(is.null(fields) || is.character(fields)) @@ -95,7 +121,6 @@ request_arguments <- function(epidata_call, format_type, fields = NULL) { #' @export print.epidata_call <- function(x, ...) { - stopifnot(inherits(x, "epidata_call")) cli::cli_h1(" object:") cli::cli_bullets(c( "*" = "Pipe this object into `fetch()` to actually fetch the data", @@ -103,53 +128,49 @@ print.epidata_call <- function(x, ...) { )) } -#' Customize fetch settings +#' Set custom API request parameters #' -#' @rdname fetch_args_list -#' @aliases fetch_args -#' -#' @description -#' A constructor for `fetch_args` objects, which are used to pass arguments to -#' the `fetch` function. +#' Used to specify custom options when making API requests, such as to set +#' timeouts or change data formats. These options are used by `fetch()` when it +#' makes calls to the Epidata API. #' #' @param ... not used for values, forces later arguments to bind by name -#' @param fields a list of epidata fields to return, or NULL to return all -#' fields (default) e.g. c("time_value", "value") to return only the -#' time_value and value fields or c("-direction") to return everything except -#' the direction field -#' @param disable_date_parsing disable automatic date parsing; by default `FALSE` -#' @param disable_data_frame_parsing disable automatic conversion to data frame; this -#' is only supported by endpoints that only support the 'classic' format (non-tabular). -#' by default `FALSE` -#' @param return_empty boolean that allows returning an empty tibble if there is no data; -#' by default `FALSE` -#' @param timeout_seconds the maximum amount of time to wait for a response; by default -#' `FALSE` -#' @param base_url base URL to use; by default `NULL`, which means the global base url -#' `"https://api.delphi.cmu.edu/epidata/"` -#' @param dry_run boolean that allows skipping the call to the API and instead -#' returns the `epidata_call` object (useful for debugging); by default `TRUE` -#' @param debug boolean that allows returning the raw response from the API; by default -#' `FALSE` -#' @param format_type the format to request from the API, one of classic, json, csv; this -#' is only used by `fetch_debug`, and by default is `"json"` -#' @return -#' - For `fetch_args_list`: a `fetch_args` object +#' @param fields a list of epidata fields to return, or `NULL` to return all +#' fields (default). e.g. `c("time_value", "value")` to return only the +#' `time_value` and `value` fields or `c("-direction")` to return everything +#' except the direction field +#' @param disable_date_parsing disable automatic date parsing +#' @param disable_data_frame_parsing disable automatic conversion to data frame; +#' this is only supported by endpoints that only support the 'classic' format +#' (non-tabular) +#' @param return_empty boolean that allows returning an empty tibble if there is +#' no data +#' @param timeout_seconds the maximum amount of time (in seconds) to wait for a +#' response from the API server +#' @param base_url base URL to use; by default `NULL`, which means the global +#' base URL `"https://api.delphi.cmu.edu/epidata/"` +#' @param dry_run if `TRUE`, skip the call to the API and instead return the +#' `epidata_call` object (useful for debugging) +#' @param debug if `TRUE`, return the raw response from the API +#' @param format_type the format to request from the API, one of classic, json, +#' csv; this is only used by `fetch_debug`, and by default is `"json"` +#' @return A `fetch_args` object containing all the specified options #' @export -#' +#' @aliases fetch_args #' @importFrom checkmate assert_character assert_logical assert_numeric -#' fetch_args_list <- function( ..., fields = NULL, disable_date_parsing = FALSE, disable_data_frame_parsing = FALSE, return_empty = FALSE, - timeout_seconds = 30, + timeout_seconds = 15 * 60, base_url = NULL, dry_run = FALSE, debug = FALSE, - format_type = "json") { + format_type = c("json", "classic", "csv")) { + rlang::check_dots_empty() + assert_character(fields, null.ok = TRUE, any.missing = FALSE) assert_logical(disable_date_parsing, null.ok = FALSE, len = 1L, any.missing = FALSE) assert_logical(disable_data_frame_parsing, null.ok = FALSE, len = 1L, any.missing = FALSE) @@ -158,8 +179,7 @@ fetch_args_list <- function( assert_character(base_url, null.ok = TRUE, len = 1L, any.missing = FALSE) assert_logical(dry_run, null.ok = FALSE, len = 1L, any.missing = TRUE) assert_logical(debug, null.ok = FALSE, len = 1L, any.missing = FALSE) - assert_character(format_type, null.ok = FALSE, len = 1L, any.missing = FALSE) - assert(format_type %in% c("json", "csv", "classic"), "format_type must be one of json, csv, classic") + format_type <- match.arg(format_type) structure( list( @@ -177,12 +197,20 @@ fetch_args_list <- function( ) } +#' @export +print.fetch_args <- function(x, ...) { + cli::cli_h1(" object:") + # Print all non-class fields. + cli::cli_dl(x[attr(x, "names")]) +} + #' Fetches the data #' #' @details -#' `fetch` usually returns the data in tibble format, but a few of the endpoints -#' only support the JSON classic format (delphi, pvt_meta_norostat, and meta). -#' In that case a JSON-like nested list structure is returned instead. +#' `fetch` usually returns the data in tibble format, but a few of the +#' endpoints only support the JSON classic format (`pub_delphi`, +#' `pvt_meta_norostat`, and `pub_meta`). In that case a +#' JSON-like nested list structure is returned instead. #' #' @rdname epidata_call #' @param epidata_call an instance of `epidata_call` @@ -260,7 +288,7 @@ fetch_classic <- function(epidata_call, fetch_args = fetch_args_list()) { stopifnot(inherits(epidata_call, "epidata_call")) stopifnot(inherits(fetch_args, "fetch_args")) - response_content <- request_impl(epidata_call, "classic", fetch_args$fields, fetch_args$timeout_seconds) %>% + response_content <- request_impl(epidata_call, "classic", fetch_args$timeout_seconds, fetch_args$fields) %>% httr::content(as = "text", encoding = "UTF-8") %>% jsonlite::fromJSON(simplifyDataFrame = !fetch_args$disable_data_frame_parsing) @@ -290,7 +318,7 @@ fetch_debug <- function(epidata_call, fetch_args = fetch_args_list()) { stopifnot(inherits(epidata_call, "epidata_call")) stopifnot(inherits(fetch_args, "fetch_args")) - response <- request_impl(epidata_call, fetch_args$format_type, fetch_args$fields, fetch_args$timeout_seconds) + response <- request_impl(epidata_call, fetch_args$format_type, fetch_args$timeout_seconds, fetch_args$fields) content <- httr::content(response, "text", encoding = "UTF-8") content } @@ -338,7 +366,7 @@ with_base_url <- function(epidata_call, base_url) { #' @importFrom httr stop_for_status content http_type #' @importFrom xml2 read_html xml_find_all xml_text #' @keywords internal -request_impl <- function(epidata_call, format_type, fields = NULL, timeout_seconds = 30) { +request_impl <- function(epidata_call, format_type, timeout_seconds, fields) { stopifnot(inherits(epidata_call, "epidata_call")) stopifnot(format_type %in% c("json", "csv", "classic")) diff --git a/R/epidatr-package.R b/R/epidatr-package.R index 8d272a30..1b22c9e4 100644 --- a/R/epidatr-package.R +++ b/R/epidatr-package.R @@ -1,3 +1,8 @@ +#' @section Package options: +#' +#' The `delphi.epidata.key` option specifies the API key to be used when making +#' requests to the Epidata API. +#' #' @keywords internal #' @include cache.R "_PACKAGE" @@ -6,6 +11,6 @@ cache_environ$use_cache <- Sys.getenv("EPIDATR_USE_CACHE", unset = FALSE) cache_environ$use_cache <- (cache_environ$use_cache == "TRUE") if (cache_environ$use_cache) { - set_cache() + set_cache(startup = TRUE) } } diff --git a/R/model.R b/R/model.R index 34865e91..90bddd51 100644 --- a/R/model.R +++ b/R/model.R @@ -1,12 +1,12 @@ -#' EpiRange +#' Specify a range of days or weeks for API requests #' -#' @description #' Specify a date range (in days or epiweeks) for an API request. #' -#' @param from A `Date`, integer-like value, or integer-like string that takes the -#' form YYYYMMDD for dates or YYYYWW for epiweeks. -#' @param to A `Date`, integer-like value, or integer-like string that takes the -#' form YYYYMMDD for dates or YYYYWW for epiweeks. +#' @param from The first date to request. Can be specified as a `Date` or as an +#' integer or integer-like string in the format YYYYMMDD for dates or YYYYWW +#' for epiweeks. +#' @param to The final date to request (inclusive), specified the same way as +#' `from`. #' @return An `EpiRange` object. #' @importFrom checkmate check_integerish check_character check_date assert #' @@ -61,34 +61,73 @@ epirange <- function(from, to) { structure(list(from = from, to = to), class = "EpiRange") } +#' helper to convert an epirange from week to day or vice versa +#' +#' @keywords internal +reformat_epirange <- function(epirange, to_type = c("day", "week")) { + to_type <- match.arg(to_type) + + # Day format -> week + if (nchar(epirange$from) == 8 && to_type == "week") { + return( + epirange(date_to_epiweek(epirange$from), date_to_epiweek(epirange$to)) + ) + # Week format -> day + } else if (nchar(epirange$from) == 6 && to_type == "day") { + return( + epirange(parse_api_week(epirange$from), parse_api_week(epirange$to)) + ) + } + + return(epirange) +} + +#' @export +print.EpiRange <- function(x, ...) { + if (nchar(x$from) == 8) { + date_type <- "Days" # nolint: object_usage_linter + x$from <- as.Date(as.character(x$from), "%Y%m%d") + x$to <- as.Date(as.character(x$to), "%Y%m%d") + } else if (nchar(x$from) == 6) { + date_type <- "Epiweeks" # nolint: object_usage_linter + x$from <- paste0( + substr(x$from, 1, 4), "w", substr(x$from, 5, 6) + ) + x$to <- paste0( + substr(x$to, 1, 4), "w", substr(x$to, 5, 6) + ) + } -#' Timeset + cli::cli_h1(" object:") + cli::cli_bullets( + "{date_type} from {x$from} to {x$to}" + ) +} + +#' Timeset formats for specifying dates #' -#' @description #' Many API calls accept timesets to specify the time ranges of data being #' requested. Timesets can be specified with `epirange()`, as `Date` objects, or #' with wildcards. #' -#' Timesets are not special R types; the term simply describes any value that -#' would be accepted by epidatr to specify the time value of an epidata query. -#' The allowed values are: +#' Timesets are not special R types; the term simply describes any value that is +#' accepted by epidatr to specify the time value of an epidata query: #' -#' - Dates: `Date` instances, integer-like values, or integer-like strings that -#' take the form YYYYMMDD. -#' - Epiweeks: Integer-like values or integer-like strings that take the form -#' YYYYWW. +#' - Dates: `Date` instances. +#' - Date strings or integers: Strings or integers in the format YYYYMMDD. +#' - Epiweeks: Strings or integers in the format YYYYWW, where WW is the epiweek +#' number. #' - EpiRanges: A range returned by `epirange()`, or a list of multiple ranges. -#' - Wildcard: The string `"*"`, which request all available time values. +#' - Wildcard: The string `"*"`, which requests all available time values. #' -#' Please refer to the specific endpoint documentation for guidance on using -#' dates vs weeks. Most endpoints support only one or the other. Some (less -#' commonly used) endpoints may not accept the `"*"` wildcard, but this can be -#' simulated with a large `epirange()`. +#' Refer to the specific endpoint documentation for guidance on using dates vs +#' weeks. Most endpoints support only one or the other. Some (less commonly +#' used) endpoints may not accept the `"*"` wildcard, but this can be simulated +#' with a large `epirange()`. #' #' @name timeset NULL - create_epidata_field_info <- function(name, type, description = "", @@ -119,19 +158,39 @@ create_epidata_field_info <- function(name, ) } +#' @export +print.EpidataFieldInfo <- function(x, ...) { + cli::cli_h1(" object:") + # Print all non-class fields. + cli::cli_dl(x[attr(x, "names")]) +} + +#' @importFrom stats na.omit parse_value <- function(info, value, disable_date_parsing = FALSE) { stopifnot(inherits(info, "EpidataFieldInfo")) if (is.null(value)) { return(value) - } else if (info$type == "date" && !disable_date_parsing) { + } else if (info$type == "date" && !disable_date_parsing && !inherits(value, "Date")) { return(parse_api_date(value)) - } else if (info$type == "epiweek" && !disable_date_parsing) { + } else if (info$type == "epiweek" && !disable_date_parsing && !inherits(value, "Date")) { return(parse_api_week(value)) } else if (info$type == "bool") { return(as.logical(value)) } else if (info$type == "int") { - return(as.integer(value)) + # Int doesn't have enough capacity to store some weekly `pub_wiki` values. + value <- as.double(value) + if (any(na.omit(value != round(value)))) { + cli::cli_warn( + c( + "Values in {info$name} were expected to be integers but contain a decimal component", + "i" = "Decimal components are returned as-is" + ), + class = "epidatr__int_nonzero_decimal_digits" + ) + } + + return(value) } else if (info$type == "float") { return(as.double(value)) } else if (info$type == "categorical") { @@ -140,13 +199,30 @@ parse_value <- function(info, value, disable_date_parsing = FALSE) { value } +#' @importFrom purrr map_chr parse_data_frame <- function(epidata_call, df, disable_date_parsing = FALSE) { stopifnot(inherits(epidata_call, "epidata_call")) meta <- epidata_call$meta df <- as.data.frame(df) + if (length(meta) == 0) { return(df) } + + meta_field_names <- map_chr(meta, "name") + missing_fields <- setdiff(names(df), meta_field_names) + if ( + length(missing_fields) != 0 + ) { + cli::cli_warn( + c( + "Not all return columns are specified as expected epidata fields", + "i" = "Unspecified fields {missing_fields} may need to be manually converted to more appropriate classes" + ), + class = "epidatr__missing_meta_fields" + ) + } + columns <- colnames(df) for (i in seq_len(length(meta))) { info <- meta[[i]] @@ -157,9 +233,23 @@ parse_data_frame <- function(epidata_call, df, disable_date_parsing = FALSE) { df } +#' Converts a date (integer or character) to an epiweek +#' @param value date (integer or character, with format YYYYMMDD) to be converted to an epiweek +#' @return an integer representing an epiweek, in the format YYYYWW +#' @importFrom MMWRweek MMWRweek +#' @keywords internal +date_to_epiweek <- function(value) { + date_components <- MMWRweek::MMWRweek(as.Date(as.character(value), "%Y%m%d")) + as.numeric(paste0( + date_components$MMWRyear, + # Pad with zeroes up to 2 digits (x -> 0x) + formatC(date_components$MMWRweek, width = 2, flag = 0) + )) +} + #' @keywords internal parse_api_date <- function(value) { - as.Date(as.character(value), format = "%Y%m%d") + as.Date(as.character(value), tryFormats = c("%Y%m%d", "%Y-%m-%d")) } #' parse_api_week converts an integer to a date diff --git a/R/request.R b/R/request.R index 276df8df..603e7bd3 100644 --- a/R/request.R +++ b/R/request.R @@ -22,25 +22,46 @@ join_url <- function(url, endpoint) { #' #' @importFrom httr RETRY #' @keywords internal -do_request <- function(url, params, timeout_seconds = 30) { +do_request <- function(url, params, timeout_seconds) { # don't retry in case of certain status codes - res <- httr::RETRY("GET", - url = url, - query = params, - terminate_on = c(400, 401, 403, 405, 414, 500), - http_headers, - httr::authenticate("epidata", get_auth_key()), - httr::timeout(timeout_seconds) - ) - if (res$status_code == 414) { - res <- httr::RETRY("POST", + key <- get_api_key() + if (key != "") { + res <- httr::RETRY("GET", url = url, - body = params, - encode = "form", + query = params, terminate_on = c(400, 401, 403, 405, 414, 500), http_headers, - httr::authenticate("epidata", get_auth_key()) + httr::authenticate("epidata", get_api_key()), + httr::timeout(timeout_seconds) ) + } else { + res <- httr::RETRY("GET", + url = url, + query = params, + terminate_on = c(400, 401, 403, 405, 414, 500), + http_headers, + httr::timeout(timeout_seconds) + ) + } + if (res$status_code == 414) { + if (key != "") { + res <- httr::RETRY("POST", + url = url, + body = params, + encode = "form", + terminate_on = c(400, 401, 403, 405, 414, 500), + http_headers, + httr::authenticate("epidata", get_api_key()) + ) + } else { + res <- httr::RETRY("POST", + url = url, + body = params, + encode = "form", + terminate_on = c(400, 401, 403, 405, 414, 500), + http_headers + ) + } } res } diff --git a/R/utils.R b/R/utils.R index 3695c501..15356734 100644 --- a/R/utils.R +++ b/R/utils.R @@ -22,15 +22,20 @@ format_list <- function(values) { #' #' @keywords internal check_is_recent <- function(dates, max_age) { - (!is.null(dates) && any(dates >= format(Sys.Date() - max_age, format = "%Y%m%d"))) + if (inherits(dates, "Date")) { + threshold <- Sys.Date() - max_age + } else { + threshold <- format(Sys.Date() - max_age, format = "%Y%m%d") + } + (!is.null(dates) && any(dates >= threshold)) } #' helper that checks whether a call is actually cachable #' #' @keywords internal check_is_cachable <- function(epidata_call, fetch_args) { - as_of_cachable <- (!is.null(epidata_call$params$as_of) && epidata_call$params$as_of != "*") - issues_cachable <- (!is.null(epidata_call$params$issues) && all(epidata_call$params$issues != "*")) + as_of_cachable <- (!is.null(epidata_call$params$as_of) && !identical(epidata_call$params$as_of, "*")) + issues_cachable <- (!is.null(epidata_call$params$issues) && all(!identical(epidata_call$params$issues, "*"))) is_cachable <- ( !is.null(cache_environ$epidatr_cache) && (as_of_cachable || issues_cachable) && @@ -44,3 +49,31 @@ check_is_cachable <- function(epidata_call, fetch_args) { ) return(is_cachable) } + +#' helper to convert a date wildcard ("*") to an appropriate epirange +#' +#' @keywords internal +get_wildcard_equivalent_dates <- function(time_value, time_type = c("day", "week")) { + time_type <- match.arg(time_type) + + if (identical(time_value, "*")) { + if (time_type == "day") { + # To get all dates, set start and end dates to extreme values. + time_value <- epirange(10000101, 30000101) + } else if (time_type == "week") { + time_value <- epirange(100001, 300001) + } + } + return(time_value) +} + +#' inserts each string as a bullet at the end of the "Prepare for release" section +#' @keywords internal +release_bullets <- function() { + c( + "merge to main", + "don't use_version('patch') in the next section", + "`use_version('patch')` is redundant because we do this in PRs", + "`use_dev_version` is also redundant." + ) +} diff --git a/README.Rmd b/README.Rmd new file mode 100644 index 00000000..51f3670c --- /dev/null +++ b/README.Rmd @@ -0,0 +1,123 @@ +--- +output: github_document +--- + + + +```{r, include = FALSE} +knitr::opts_chunk$set( + collapse = TRUE, + comment = "#>", + fig.path = "man/figures/README-", + out.width = "100%" +) +ggplot2::theme_set(ggplot2::theme_bw()) +``` + +# Delphi Epidata R client + + +[![License: MIT][mit-image]][mit-url] [![Github Actions][github-actions-image]][github-actions-url] +[![codecov](https://codecov.io/gh/dsweber2/epidatr/branch/dev/graph/badge.svg?token=jVHL9eHZNZ)](https://app.codecov.io/gh/dsweber2/epidatr) + + +The [Delphi Epidata API](https://cmu-delphi.github.io/delphi-epidata/) provides +real-time access to epidemiological surveillance data for influenza, COVID-19, +and other diseases from both official government sources such as the [Centers +for Disease Control and Prevention +(CDC)](https://www.cdc.gov/datastatistics/index.html), private partners such as +[Facebook (now +Meta)](https://delphi.cmu.edu/blog/2020/08/26/covid-19-symptom-surveys-through-facebook/) +and [Change Healthcare](https://www.changehealthcare.com/), and other public +datasets like [Google +Trends](https://console.cloud.google.com/marketplace/product/bigquery-public-datasets/covid19-search-trends). +It is built and maintained by the Carnegie Mellon University [Delphi Research +Group](https://delphi.cmu.edu/). + +This package is designed to streamline the downloading and usage of data from +the Delphi Epidata API. It provides a simple R interface to the API, including +functions for downloading data, parsing the results, and converting the data +into a tidy format. The API stores a historical record of all data, including +corrections and updates, which is particularly useful for accurately backtesting +forecasting models. We also provide packages for downstream data processing +([epiprocess](https://github.com/cmu-delphi/epiprocess)) and modeling +([epipredict](https://github.com/cmu-delphi/epipredict)). + +## Usage + +```{r, echo=FALSE} +# This is so that if you have USE_EPIDATR_CACHE=TRUE in your .Renviron, the +# startup message does not get included in the README.md when you build this. +suppressPackageStartupMessages(library(epidatr)) +``` + +```{r} +library(epidatr) +# Obtain the smoothed covid-like illness (CLI) signal from Delphi's US COVID-19 +# Trends and Impact Survey (CTIS), in partnership with Facebook, as it was on +# April 10, 2021 for the US at the national level +epidata <- pub_covidcast( + source = "fb-survey", + signals = "smoothed_cli", + geo_type = "nation", + time_type = "day", + geo_values = "us", + time_values = epirange(20210101, 20210601), + as_of = 20210601 +) +epidata +``` + +## Installation + +Installing the package is straightforward. + +```R +# Install the CRAN version +pak::pkg_install("epidatr") +# Install the development version from the GitHub dev branch +pak::pkg_install("cmu-delphi/epidatr@dev") +``` + +### API Keys + +The Delphi API requires a (free) API key for full functionality. To generate +your key, register for a pseudo-anonymous account +[here](https://api.delphi.cmu.edu/epidata/admin/registration_form) and see more +discussion on the [general API +website](https://cmu-delphi.github.io/delphi-epidata/api/api_keys.html). The +`epidatr` client will automatically look for this key in the environment +variable `DELPHI_EPIDATA_KEY`. We recommend storing your key in your `.Renviron` +file, which R will read by default. + +Note that for the time being, the private endpoints (i.e. those prefixed with +`pvt`) will require a separate key that needs to be passed as an argument. + +## For users of the covidcast R package + +The `covidcast` package is deprecated and will no longer be updated. The +`epidatr` package is a complete rewrite of the [`covidcast` +package](https://cmu-delphi.github.io/covidcast/covidcastR/), with a focus on +speed, reliability, and ease of use. It also supports more endpoints and data +sources than `covidcast`. When migrating from that package, you will need to use +the +[`pub_covidcast`](https://cmu-delphi.github.io/epidatr/reference/pub_covidcast.html) +function in `epidatr`. + +## Get updates + +**You should consider subscribing to the [API mailing list](https://lists.andrew.cmu.edu/mailman/listinfo/delphi-covidcast-api)** to be notified of package updates, new data sources, corrections, and other updates. + +## Usage terms and citation + +We request that if you use the `epidatr` package in your work, or use any of the data provided by the Delphi Epidata API through non-`covidcast` endpoints, that you cite us using the citation given by [`citation("epidatr")`](https://cmu-delphi.github.io/epidatr/dev/authors.html#citation). If you use any of the data from the `covidcast` endpoint, please use the [COVIDcast citation](https://cmu-delphi.github.io/covidcast/covidcastR/authors.html#citation) as well. See the [COVIDcast licensing documentation](https://cmu-delphi.github.io/delphi-epidata/api/covidcast_licensing.html) and the [licensing documentation for other endpoints](https://cmu-delphi.github.io/delphi-epidata/api/README.html#data-licensing) for information about citing the datasets provided by the API. + +**Warning:** If you use data from the Epidata API to power a product, dashboard, app, or other service, please download the data you need and store it centrally rather than making API requests for every user. Our server resources are limited and cannot support high-volume interactive use. + +See also the [Terms of Use](https://delphi.cmu.edu/covidcast/terms-of-use/), noting that the data is a research product and not warranted for a particular purpose. + + +[mit-image]: https://img.shields.io/badge/License-MIT-yellow.svg +[mit-url]: https://opensource.org/license/mit +[github-actions-image]: https://github.com/cmu-delphi/epidatr/workflows/ci/badge.svg +[github-actions-url]: https://github.com/cmu-delphi/epidatr/actions diff --git a/README.md b/README.md index 643ec3f0..e849ac2d 100644 --- a/README.md +++ b/README.md @@ -1,18 +1,47 @@ -# Delphi Epidata R client -[![License: MIT][mit-image]][mit-url] [![Github Actions][github-actions-image]][github-actions-url] -[![codecov](https://codecov.io/gh/dsweber2/epidatr/branch/dev/graph/badge.svg?token=jVHL9eHZNZ)](https://app.codecov.io/gh/dsweber2/epidatr) + + +# Delphi Epidata R client -The [Delphi Epidata API](https://cmu-delphi.github.io/delphi-epidata/) provides real-time access to epidemiological surveillance data for influenza, COVID-19, and other diseases for the USA at various geographical resolutions, both from official government sources such as the [Center for Disease Control (CDC)](https://www.cdc.gov/datastatistics/index.html) and [Google Trends](https://cmu-delphi.github.io/delphi-epidata/api/covidcast-signals/google-symptoms.html) and private partners such as [Facebook](https://delphi.cmu.edu/blog/2020/08/26/covid-19-symptom-surveys-through-facebook/) and [Change Healthcare](https://www.changehealthcare.com/). It is built and maintained by the Carnegie Mellon University [Delphi research group](https://delphi.cmu.edu/). + -This package is designed to streamline the downloading and usage of data from the [Delphi Epidata -API](https://cmu-delphi.github.io/delphi-epidata/). It provides a simple R interface to the API, including functions for downloading data, parsing the results, and converting the data into a tidy format. The API stores a historical record of all data, including corrections and updates, which is particularly useful for accurately backtesting forecasting models. We also provide packages for downstream data processing ([epiprocess](https://github.com/cmu-delphi/epiprocess)) and modeling ([epipredict](https://github.com/cmu-delphi/epipredict)). +[![License: +MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/license/mit) +[![Github +Actions](https://github.com/cmu-delphi/epidatr/workflows/ci/badge.svg)](https://github.com/cmu-delphi/epidatr/actions) +[![codecov](https://codecov.io/gh/dsweber2/epidatr/branch/dev/graph/badge.svg?token=jVHL9eHZNZ)](https://app.codecov.io/gh/dsweber2/epidatr) + + +The [Delphi Epidata API](https://cmu-delphi.github.io/delphi-epidata/) +provides real-time access to epidemiological surveillance data for +influenza, COVID-19, and other diseases from both official government +sources such as the [Centers for Disease Control and Prevention +(CDC)](https://www.cdc.gov/datastatistics/index.html), private partners +such as [Facebook (now +Meta)](https://delphi.cmu.edu/blog/2020/08/26/covid-19-symptom-surveys-through-facebook/) +and [Change Healthcare](https://www.changehealthcare.com/), and other +public datasets like [Google +Trends](https://console.cloud.google.com/marketplace/product/bigquery-public-datasets/covid19-search-trends). +It is built and maintained by the Carnegie Mellon University [Delphi +Research Group](https://delphi.cmu.edu/). + +This package is designed to streamline the downloading and usage of data +from the Delphi Epidata API. It provides a simple R interface to the +API, including functions for downloading data, parsing the results, and +converting the data into a tidy format. The API stores a historical +record of all data, including corrections and updates, which is +particularly useful for accurately backtesting forecasting models. We +also provide packages for downstream data processing +([epiprocess](https://github.com/cmu-delphi/epiprocess)) and modeling +([epipredict](https://github.com/cmu-delphi/epipredict)). ## Usage -```R +``` r library(epidatr) -# Obtain the smoothed covid-like illness (CLI) signal from the Facebook survey as it was on April 10, 2021 for the US +# Obtain the smoothed covid-like illness (CLI) signal from Delphi's US COVID-19 +# Trends and Impact Survey (CTIS), in partnership with Facebook, as it was on +# April 10, 2021 for the US at the national level epidata <- pub_covidcast( source = "fb-survey", signals = "smoothed_cli", @@ -20,76 +49,92 @@ epidata <- pub_covidcast( time_type = "day", geo_values = "us", time_values = epirange(20210101, 20210601), - as_of = "2021-06-01" + as_of = 20210601 ) epidata +#> # A tibble: 151 × 15 +#> geo_value signal source geo_type time_type time_value direction issue +#> +#> 1 us smoothed… fb-su… nation day 2021-01-01 NA 2021-01-06 +#> 2 us smoothed… fb-su… nation day 2021-01-02 NA 2021-01-07 +#> 3 us smoothed… fb-su… nation day 2021-01-03 NA 2021-01-08 +#> 4 us smoothed… fb-su… nation day 2021-01-04 NA 2021-01-09 +#> 5 us smoothed… fb-su… nation day 2021-01-05 NA 2021-01-10 +#> 6 us smoothed… fb-su… nation day 2021-01-06 NA 2021-01-29 +#> 7 us smoothed… fb-su… nation day 2021-01-07 NA 2021-01-29 +#> 8 us smoothed… fb-su… nation day 2021-01-08 NA 2021-01-29 +#> 9 us smoothed… fb-su… nation day 2021-01-09 NA 2021-01-29 +#> 10 us smoothed… fb-su… nation day 2021-01-10 NA 2021-01-29 +#> # ℹ 141 more rows +#> # ℹ 7 more variables: lag , missing_value , missing_stderr , +#> # missing_sample_size , value , stderr , sample_size ``` -``` -# A tibble: 6 × 15 - geo_value signal source geo_type time_type time_value - -1 us smoothed_cli fb-surv… nation day 2021-04-05 -2 us smoothed_cli fb-surv… nation day 2021-04-06 -3 us smoothed_cli fb-surv… nation day 2021-04-07 -4 us smoothed_cli fb-surv… nation day 2021-04-08 -5 us smoothed_cli fb-surv… nation day 2021-04-09 -6 us smoothed_cli fb-surv… nation day 2021-04-10 -# ℹ 9 more variables: direction , issue , -# lag , missing_value , missing_stderr , -# missing_sample_size , value , stderr , -# sample_size -``` - -```r -# Plot this data -library(ggplot2) -ggplot(epidata, aes(x = time_value, y = value)) + - geom_line() + - labs(title = "Smoothed CLI from Facebook Survey", - subtitle = "US, 2021", - x = "Date", - y = "CLI") -``` - -![Smoothed CLI from Facebook Survey](man/figures/fb-cli-signal.png) - ## Installation -Install from GitHub: +Installing the package is straightforward. -```R -# Install the dev version using `pak` or `remotes` -pak::pkg_install("cmu-delphi/epidatr") -remotes::install_github("cmu-delphi/epidatr") +``` r +# Install the CRAN version +pak::pkg_install("epidatr") +# Install the development version from the GitHub dev branch +pak::pkg_install("cmu-delphi/epidatr@dev") ``` -CRAN version coming soon. - ### API Keys -The Delphi API requires a (free) API key for full functionality. To generate -your key, register for a pseudo-anonymous account -[here](https://api.delphi.cmu.edu/epidata/admin/registration_form) and see more -discussion on the [general API -website](https://cmu-delphi.github.io/delphi-epidata/api/api_keys.html). The -`epidatr` client will automatically look for this key in the R option -`delphi.epidata.key` or in the environment variable -`DELPHI_EPIDATA_KEY`. We recommend storing your key in `.Renviron` file, which R -will read by default. - -Note that for the time being, the private endpoints (i.e. those prefixed with -`pvt`) will require a separate key that needs to be passed as an argument. - -[mit-image]: https://img.shields.io/badge/License-MIT-yellow.svg -[mit-url]: https://opensource.org/license/mit/ -[github-actions-image]: https://github.com/cmu-delphi/epidatr/workflows/ci/badge.svg -[github-actions-url]: https://github.com/cmu-delphi/epidatr/actions +The Delphi API requires a (free) API key for full functionality. To +generate your key, register for a pseudo-anonymous account +[here](https://api.delphi.cmu.edu/epidata/admin/registration_form) and +see more discussion on the [general API +website](https://cmu-delphi.github.io/delphi-epidata/api/api_keys.html). +The `epidatr` client will automatically look for this key in the +environment variable `DELPHI_EPIDATA_KEY`. We recommend storing your key +in your `.Renviron` file, which R will read by default. + +Note that for the time being, the private endpoints (i.e. those prefixed +with `pvt`) will require a separate key that needs to be passed as an +argument. + +## For users of the covidcast R package + +The `covidcast` package is deprecated and will no longer be updated. The +`epidatr` package is a complete rewrite of the [`covidcast` +package](https://cmu-delphi.github.io/covidcast/covidcastR/), with a +focus on speed, reliability, and ease of use. It also supports more +endpoints and data sources than `covidcast`. When migrating from that +package, you will need to use the +[`pub_covidcast`](https://cmu-delphi.github.io/epidatr/reference/pub_covidcast.html) +function in `epidatr`. ## Get updates -You should consider subscribing to the [API mailing list](https://lists.andrew.cmu.edu/mailman/listinfo/delphi-covidcast-api) to be notified of package updates, new data sources, corrections, and other updates. - -## For users of the `covidcast` R package - -The `epidatr` package is a complete rewrite of the [`covidcast` package](https://cmu-delphi.github.io/covidcast/covidcastR/), with a focus on speed, reliability, and ease of use. The `covidcast` package is deprecated and will no longer be updated. +**You should consider subscribing to the [API mailing +list](https://lists.andrew.cmu.edu/mailman/listinfo/delphi-covidcast-api)** +to be notified of package updates, new data sources, corrections, and +other updates. + +## Usage terms and citation + +We request that if you use the `epidatr` package in your work, or use +any of the data provided by the Delphi Epidata API through +non-`covidcast` endpoints, that you cite us using the citation given by +[`citation("epidatr")`](https://cmu-delphi.github.io/epidatr/dev/authors.html#citation). +If you use any of the data from the `covidcast` endpoint, please use the +[COVIDcast +citation](https://cmu-delphi.github.io/covidcast/covidcastR/authors.html#citation) +as well. See the [COVIDcast licensing +documentation](https://cmu-delphi.github.io/delphi-epidata/api/covidcast_licensing.html) +and the [licensing documentation for other +endpoints](https://cmu-delphi.github.io/delphi-epidata/api/README.html#data-licensing) +for information about citing the datasets provided by the API. + +**Warning:** If you use data from the Epidata API to power a product, +dashboard, app, or other service, please download the data you need and +store it centrally rather than making API requests for every user. Our +server resources are limited and cannot support high-volume interactive +use. + +See also the [Terms of +Use](https://delphi.cmu.edu/covidcast/terms-of-use/), noting that the +data is a research product and not warranted for a particular purpose. diff --git a/_pkgdown.yml b/_pkgdown.yml index 7b5c1c3b..98124004 100644 --- a/_pkgdown.yml +++ b/_pkgdown.yml @@ -1,38 +1,68 @@ +# Colors should stay consistent across epipredict & epidatr, using Carnegie +# Red https://www.cmu.edu/brand/brand-guidelines/visual-identity/colors.html + +# This is to give a default value to the `mode` parameter in the +# `pkgdown::build_site` function. This is useful when building the site locally, +# as it will default to `devel` mode. In practice, this should all be handled +# dynamically by the CI/CD pipeline. +development: + mode: devel + version_label: success + +template: + bootstrap: 5 + bootswatch: cosmo + bslib: + font_scale: 1.0 + primary: "#C41230" + link-color: "#C41230" + +navbar: + bg: primary + type: dark + home: links: - text: Get the Python client href: https://github.com/cmu-delphi/epidatpy/ - - text: View the Delphi Website href: https://delphi.cmu.edu/ + - text: Introduction to Delphi's Tooling Work + href: https://cmu-delphi.github.io/delphi-tooling-book/ + - text: The epiprocess R package + href: https://cmu-delphi.github.io/epiprocess/ + - text: The epipredict R package + href: https://cmu-delphi.github.io/epipredict/ + - text: The epidatasets R package + href: https://cmu-delphi.github.io/epidatasets/ reference: + - title: Data source and signal discovery + desc: Quickly explore endpoints, and API signal and source names + - contents: + - avail_endpoints + - covidcast_epidata + - title: Make API requests + desc: Query Delphi Epidata endpoints + - contents: + - epidata_call + - fetch_args_list + - has_keyword("endpoint") + - -starts_with("pvt_") - title: Configuration and utilities desc: Set API keys and handle API data types - contents: - - get_auth_key - - avail_endpoints + - get_api_key - epirange - timeset - - title: Control Caching behavior + - title: Control caching behavior desc: Configure an optional persistent cache - contents: - set_cache - clear_cache - disable_cache - cache_info - - title: Make API requests - desc: Query Delphi Epidata endpoints - - contents: - - epidata_call - - fetch_args_list - - has_keyword("endpoint") - - -starts_with("pvt_") - title: Make requests to private API endpoints desc: These endpoints require additional authorization to use - contents: - starts_with("pvt_") - - title: Autocomplete helpers - desc: Objects that can autocomplete API signals names for faster exploration - - contents: - - covidcast_epidata diff --git a/man/avail_endpoints.Rd b/man/avail_endpoints.Rd index f669cd22..9a6cb0ce 100644 --- a/man/avail_endpoints.Rd +++ b/man/avail_endpoints.Rd @@ -2,17 +2,19 @@ % Please edit documentation in R/avail_endpoints.R \name{avail_endpoints} \alias{avail_endpoints} -\title{List all available endpoints.} +\title{List all available Epidata API endpoints} \usage{ avail_endpoints() } \value{ -A \code{\link[tibble:tibble]{tibble::tibble}}. +A \code{\link[tibble:tibble]{tibble::tibble}} of endpoints, with two columns: +\item{Endpoint}{Name of the function for accessing this API endpoint.} +\item{Description}{One-sentence description of the data available at the +endpoint.} } \description{ -A function that prints a tibble with two columns: \code{Endpoint} contains the -function for accessing the Delphi Epidata API endpoint along with a -\code{Description}. +Fetches a data frame of all Epidata API endpoints that can be accessed using +this package, with a brief description. } \examples{ avail_endpoints() diff --git a/man/clear_cache.Rd b/man/clear_cache.Rd index c377c612..f5d232b9 100644 --- a/man/clear_cache.Rd +++ b/man/clear_cache.Rd @@ -4,19 +4,16 @@ \alias{clear_cache} \title{Manually reset the cache, deleting all currently saved data and starting afresh} \usage{ -clear_cache(disable = FALSE, ...) +clear_cache(..., disable = FALSE) } \arguments{ -\item{disable}{instead of setting a new cache, disable caching entirely; -defaults to \code{FALSE}} - \item{...}{ Arguments passed on to \code{\link[=set_cache]{set_cache}} \describe{ \item{\code{cache_dir}}{the directory in which the cache is stored. By default, this -is \code{tools::R_user_dir()} if on R 4.0+, but must be specified for earlier -versions of R. The path can be either relative or absolute. The -environmental variable is \code{EPIDATR_CACHE_DIR}.} +is \code{rappdirs::user_cache_dir("R", version = "epidatr")}. The path can be +either relative or absolute. The environmental variable is +\code{EPIDATR_CACHE_DIR}.} \item{\code{days}}{the maximum length of time in days to keep any particular cached call. By default this is \code{1}. The environmental variable is \code{EPIDATR_CACHE_MAX_AGE_DAYS}.} @@ -28,7 +25,12 @@ cache directory. By default, it is \code{"logfile.txt"}. The environmental variable is \code{EPIDATR_CACHE_LOGFILE}.} \item{\code{confirm}}{whether to confirm directory creation. default is \code{TRUE}; should only be set in non-interactive scripts} + \item{\code{startup}}{indicates whether the function is being called on +startup. Affects suppressability of the messages. Default is \code{FALSE}.} }} + +\item{disable}{instead of setting a new cache, disable caching entirely; +defaults to \code{FALSE}} } \value{ \code{\link{NULL}} no return value, all effects are stored in the package diff --git a/man/covidcast_epidata.Rd b/man/covidcast_epidata.Rd index 2ab9fd75..9fe31718 100644 --- a/man/covidcast_epidata.Rd +++ b/man/covidcast_epidata.Rd @@ -56,7 +56,7 @@ to access them we rely on the backtick operator: }\if{html}{\out{}} These objects can be used directly to fetch data, without requiring us to use -the \code{covidcast()} function. Simply use the \verb{$call} attribute of the object: +the \code{pub_covidcast()} function. Simply use the \verb{$call} attribute of the object: \if{html}{\out{
}}\preformatted{epidata$signals$`fb-survey:smoothed_cli`$call("state", "pa", epirange(20210405, 20210410)) @@ -69,7 +69,7 @@ the \code{covidcast()} function. Simply use the \verb{$call} attribute of the ob #> 4 pa smoothed_~ fb-su~ state day 2021-04-08 NA 2021-04-13 #> 5 pa smoothed_~ fb-su~ state day 2021-04-09 NA 2021-04-14 #> 6 pa smoothed_~ fb-su~ state day 2021-04-10 NA 2021-04-15 -#> # i 7 more variables: lag , missing_value , missing_stderr , -#> # missing_sample_size , value , stderr , sample_size +#> # i 7 more variables: lag , missing_value , missing_stderr , +#> # missing_sample_size , value , stderr , sample_size }\if{html}{\out{
}} } diff --git a/man/date_to_epiweek.Rd b/man/date_to_epiweek.Rd new file mode 100644 index 00000000..7f1f4262 --- /dev/null +++ b/man/date_to_epiweek.Rd @@ -0,0 +1,18 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/model.R +\name{date_to_epiweek} +\alias{date_to_epiweek} +\title{Converts a date (integer or character) to an epiweek} +\usage{ +date_to_epiweek(value) +} +\arguments{ +\item{value}{date (integer or character, with format YYYYMMDD) to be converted to an epiweek} +} +\value{ +an integer representing an epiweek, in the format YYYYWW +} +\description{ +Converts a date (integer or character) to an epiweek +} +\keyword{internal} diff --git a/man/do_request.Rd b/man/do_request.Rd index 7add7b85..e5cd7995 100644 --- a/man/do_request.Rd +++ b/man/do_request.Rd @@ -4,7 +4,7 @@ \alias{do_request} \title{performs the request} \usage{ -do_request(url, params, timeout_seconds = 30) +do_request(url, params, timeout_seconds) } \description{ You can test the authentication headers like so: diff --git a/man/epidata_call.Rd b/man/epidata_call.Rd index dab13c9c..c2ef4b6b 100644 --- a/man/epidata_call.Rd +++ b/man/epidata_call.Rd @@ -41,8 +41,8 @@ fetch(epidata_call, fetch_args = fetch_args_list()) \code{epidata_call} objects are generated internally by endpoint functions like \code{\link{pub_covidcast}}; by default, they are piped directly into the \code{fetch} function to fetch and format the data. For most endpoints this will return -a tibble, but a few non-COVIDCAST endpoints only support will return a -JSON-like list instead. +a tibble, but a few non-COVIDCAST endpoints will return a JSON-like list +instead. } \details{ \code{create_epidata_call} is the constructor for \code{epidata_call} objects, but you @@ -54,9 +54,10 @@ There are some other functions available for debugging and advanced usage: - \code{request_url} (for debugging): outputs the request URL from which data would be fetched (note additional parameters below) -\code{fetch} usually returns the data in tibble format, but a few of the endpoints -only support the JSON classic format (delphi, pvt_meta_norostat, and meta). -In that case a JSON-like nested list structure is returned instead. +\code{fetch} usually returns the data in tibble format, but a few of the +endpoints only support the JSON classic format (\code{pub_delphi}, +\code{pvt_meta_norostat}, and \code{pub_meta}). In that case a +JSON-like nested list structure is returned instead. } \examples{ \dontrun{ diff --git a/man/epidatr-package.Rd b/man/epidatr-package.Rd index b2e49714..9521ea06 100644 --- a/man/epidatr-package.Rd +++ b/man/epidatr-package.Rd @@ -8,6 +8,13 @@ \description{ The Delphi 'Epidata' API provides real-time access to epidemiological surveillance data for influenza, 'COVID-19', and other diseases for the USA at various geographical resolutions, both from official government sources such as the Center for Disease Control (CDC) and Google Trends and private partners such as Facebook and Change 'Healthcare'. It is built and maintained by the Carnegie Mellon University Delphi research group. To cite this API: David C. Farrow, Logan C. Brooks, Aaron 'Rumack', Ryan J. 'Tibshirani', 'Roni' 'Rosenfeld' (2015). Delphi 'Epidata' API. \url{https://github.com/cmu-delphi/delphi-epidata}. } +\section{Package options}{ + + +The \code{delphi.epidata.key} option specifies the API key to be used when making +requests to the Epidata API. +} + \seealso{ Useful links: \itemize{ diff --git a/man/epirange.Rd b/man/epirange.Rd index 1f4605e6..0fba2433 100644 --- a/man/epirange.Rd +++ b/man/epirange.Rd @@ -2,16 +2,17 @@ % Please edit documentation in R/model.R \name{epirange} \alias{epirange} -\title{EpiRange} +\title{Specify a range of days or weeks for API requests} \usage{ epirange(from, to) } \arguments{ -\item{from}{A \code{Date}, integer-like value, or integer-like string that takes the -form YYYYMMDD for dates or YYYYWW for epiweeks.} +\item{from}{The first date to request. Can be specified as a \code{Date} or as an +integer or integer-like string in the format YYYYMMDD for dates or YYYYWW +for epiweeks.} -\item{to}{A \code{Date}, integer-like value, or integer-like string that takes the -form YYYYMMDD for dates or YYYYWW for epiweeks.} +\item{to}{The final date to request (inclusive), specified the same way as +\code{from}.} } \value{ An \code{EpiRange} object. diff --git a/man/fetch_args_list.Rd b/man/fetch_args_list.Rd index e33de228..ca6f7dcf 100644 --- a/man/fetch_args_list.Rd +++ b/man/fetch_args_list.Rd @@ -3,7 +3,7 @@ \name{fetch_args_list} \alias{fetch_args_list} \alias{fetch_args} -\title{Customize fetch settings} +\title{Set custom API request parameters} \usage{ fetch_args_list( ..., @@ -11,51 +11,49 @@ fetch_args_list( disable_date_parsing = FALSE, disable_data_frame_parsing = FALSE, return_empty = FALSE, - timeout_seconds = 30, + timeout_seconds = 15 * 60, base_url = NULL, dry_run = FALSE, debug = FALSE, - format_type = "json" + format_type = c("json", "classic", "csv") ) } \arguments{ \item{...}{not used for values, forces later arguments to bind by name} -\item{fields}{a list of epidata fields to return, or NULL to return all -fields (default) e.g. c("time_value", "value") to return only the -time_value and value fields or c("-direction") to return everything except -the direction field} +\item{fields}{a list of epidata fields to return, or \code{NULL} to return all +fields (default). e.g. \code{c("time_value", "value")} to return only the +\code{time_value} and \code{value} fields or \code{c("-direction")} to return everything +except the direction field} -\item{disable_date_parsing}{disable automatic date parsing; by default \code{FALSE}} +\item{disable_date_parsing}{disable automatic date parsing} -\item{disable_data_frame_parsing}{disable automatic conversion to data frame; this -is only supported by endpoints that only support the 'classic' format (non-tabular). -by default \code{FALSE}} +\item{disable_data_frame_parsing}{disable automatic conversion to data frame; +this is only supported by endpoints that only support the 'classic' format +(non-tabular)} -\item{return_empty}{boolean that allows returning an empty tibble if there is no data; -by default \code{FALSE}} +\item{return_empty}{boolean that allows returning an empty tibble if there is +no data} -\item{timeout_seconds}{the maximum amount of time to wait for a response; by default -\code{FALSE}} +\item{timeout_seconds}{the maximum amount of time (in seconds) to wait for a +response from the API server} -\item{base_url}{base URL to use; by default \code{NULL}, which means the global base url -\code{"https://api.delphi.cmu.edu/epidata/"}} +\item{base_url}{base URL to use; by default \code{NULL}, which means the global +base URL \code{"https://api.delphi.cmu.edu/epidata/"}} -\item{dry_run}{boolean that allows skipping the call to the API and instead -returns the \code{epidata_call} object (useful for debugging); by default \code{TRUE}} +\item{dry_run}{if \code{TRUE}, skip the call to the API and instead return the +\code{epidata_call} object (useful for debugging)} -\item{debug}{boolean that allows returning the raw response from the API; by default -\code{FALSE}} +\item{debug}{if \code{TRUE}, return the raw response from the API} -\item{format_type}{the format to request from the API, one of classic, json, csv; this -is only used by \code{fetch_debug}, and by default is \code{"json"}} +\item{format_type}{the format to request from the API, one of classic, json, +csv; this is only used by \code{fetch_debug}, and by default is \code{"json"}} } \value{ -\itemize{ -\item For \code{fetch_args_list}: a \code{fetch_args} object -} +A \code{fetch_args} object containing all the specified options } \description{ -A constructor for \code{fetch_args} objects, which are used to pass arguments to -the \code{fetch} function. +Used to specify custom options when making API requests, such as to set +timeouts or change data formats. These options are used by \code{fetch()} when it +makes calls to the Epidata API. } diff --git a/man/figures/README-fb-cli-signal-1.png b/man/figures/README-fb-cli-signal-1.png new file mode 100644 index 00000000..21c040f1 Binary files /dev/null and b/man/figures/README-fb-cli-signal-1.png differ diff --git a/man/get_api_key.Rd b/man/get_api_key.Rd new file mode 100644 index 00000000..2fd9b1b7 --- /dev/null +++ b/man/get_api_key.Rd @@ -0,0 +1,42 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/auth.R +\name{get_api_key} +\alias{get_api_key} +\alias{save_api_key} +\title{Get and set API keys} +\usage{ +get_api_key() + +save_api_key() +} +\value{ +For \code{get_api_key()}, returns the current API key as a string, or +\code{""} if none is set. +} +\description{ +Get and set the API key used to make requests to the Epidata API. Without a +key, requests may be subject to rate limits and other limitations. +} +\details{ +We recommend you register for an API key. While most endpoints are available +without one, there are \href{https://cmu-delphi.github.io/delphi-epidata/api/api_keys.html}{limits on API usage for anonymous users}, +including a rate limit. If you regularly request large amounts of data, +please consider \href{https://api.delphi.cmu.edu/epidata/admin/registration_form}{registering for an API key}. + +API keys are strings read from the environment variable \code{DELPHI_EPIDATA_KEY}. +We recommend setting your key with \code{save_api_key()}, which will modify an +applicable \code{.Renviron} file, which will be read in automatically when you +start future R sessions (see \code{\link[base:Startup]{?Startup}} for details on +\code{.Renviron} files). Alternatively, you can modify the environment variable at +the command line before/while launching R, or inside an R session with +\code{\link[=Sys.setenv]{Sys.setenv()}}, but these will not persist across sessions. + +Once an API key is set, it is automatically used for all requests made by +functions in this package. +} +\references{ +\itemize{ +\item \href{https://cmu-delphi.github.io/delphi-epidata/api/api_keys.html}{Delphi Epidata API Keys documentation}. +\item \href{https://api.delphi.cmu.edu/epidata/admin/registration_form}{Delphi Epidata API Registration Form}. +} +} diff --git a/man/get_auth_key.Rd b/man/get_auth_key.Rd deleted file mode 100644 index 65808781..00000000 --- a/man/get_auth_key.Rd +++ /dev/null @@ -1,15 +0,0 @@ -% Generated by roxygen2: do not edit by hand -% Please edit documentation in R/auth.R -\name{get_auth_key} -\alias{get_auth_key} -\title{Getting the API key} -\usage{ -get_auth_key() -} -\value{ -The API key as a string or "". -} -\description{ -Get the API key from the environment variable \code{DELPHI_EPIDATA_KEY} or -\code{getOption("delphi.epidata.key")}. -} diff --git a/man/get_wildcard_equivalent_dates.Rd b/man/get_wildcard_equivalent_dates.Rd new file mode 100644 index 00000000..590a4745 --- /dev/null +++ b/man/get_wildcard_equivalent_dates.Rd @@ -0,0 +1,12 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/utils.R +\name{get_wildcard_equivalent_dates} +\alias{get_wildcard_equivalent_dates} +\title{helper to convert a date wildcard ("*") to an appropriate epirange} +\usage{ +get_wildcard_equivalent_dates(time_value, time_type = c("day", "week")) +} +\description{ +helper to convert a date wildcard ("*") to an appropriate epirange +} +\keyword{internal} diff --git a/man/pub_covid_hosp_facility.Rd b/man/pub_covid_hosp_facility.Rd index df7d4d9a..59f4ff9b 100644 --- a/man/pub_covid_hosp_facility.Rd +++ b/man/pub_covid_hosp_facility.Rd @@ -2,11 +2,11 @@ % Please edit documentation in R/endpoints.R \name{pub_covid_hosp_facility} \alias{pub_covid_hosp_facility} -\title{COVID hospitalization data for specific facilities} +\title{COVID hospitalizations by facility} \usage{ pub_covid_hosp_facility( hospital_pks, - collection_weeks, + collection_weeks = "*", ..., publication_dates = NULL, fetch_args = fetch_args_list() @@ -15,7 +15,8 @@ pub_covid_hosp_facility( \arguments{ \item{hospital_pks}{character. Facility identifiers.} -\item{collection_weeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{collection_weeks}{\code{\link{timeset}}. Dates (corresponding to epiweeks) to +fetch. Defaults to all ("*") dates.} \item{...}{not used for values, forces later arguments to bind by name} @@ -45,6 +46,11 @@ pub_covid_hosp_facility( hospital_pks = "100075", collection_weeks = epirange(20200101, 20200501) ) + +pub_covid_hosp_facility( + hospital_pks = "100075", + collection_weeks = epirange(202001, 202005) +) } } \seealso{ diff --git a/man/pub_covid_hosp_facility_lookup.Rd b/man/pub_covid_hosp_facility_lookup.Rd index 88b5d93d..718d153b 100644 --- a/man/pub_covid_hosp_facility_lookup.Rd +++ b/man/pub_covid_hosp_facility_lookup.Rd @@ -2,7 +2,7 @@ % Please edit documentation in R/endpoints.R \name{pub_covid_hosp_facility_lookup} \alias{pub_covid_hosp_facility_lookup} -\title{COVID hospitalization facility identifiers} +\title{Helper for finding COVID hospitalization facilities} \usage{ pub_covid_hosp_facility_lookup( ..., diff --git a/man/pub_covid_hosp_state_timeseries.Rd b/man/pub_covid_hosp_state_timeseries.Rd index e032314f..246bf7b1 100644 --- a/man/pub_covid_hosp_state_timeseries.Rd +++ b/man/pub_covid_hosp_state_timeseries.Rd @@ -2,12 +2,13 @@ % Please edit documentation in R/endpoints.R \name{pub_covid_hosp_state_timeseries} \alias{pub_covid_hosp_state_timeseries} -\title{COVID Hospitalization Data by State} +\title{COVID hospitalizations by state} \usage{ pub_covid_hosp_state_timeseries( states, - dates, + dates = "*", ..., + as_of = NULL, issues = NULL, fetch_args = fetch_args_list() ) @@ -15,12 +16,17 @@ pub_covid_hosp_state_timeseries( \arguments{ \item{states}{character. Two letter state abbreviations.} -\item{dates}{\code{\link{timeset}}. Dates to fetch.} +\item{dates}{\code{\link{timeset}}. Dates to fetch. Defaults to all ("*") dates.} \item{...}{not used for values, forces later arguments to bind by name} -\item{issues}{\code{\link{timeset}}. Optionally, the issues to fetch. If not set, the -most recent issue is returned.} +\item{as_of}{Date. Optionally, the as of date for the issues to fetch. If not +specified, the most recent data is returned. Mutually exclusive with +\code{issues}.} + +\item{issues}{\code{\link{timeset}}. Optionally, the issue of the data to fetch. If not +specified, the most recent issue is returned. Mutually exclusive with +\code{as_of} or \code{lag}.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } diff --git a/man/pub_covidcast.Rd b/man/pub_covidcast.Rd index c530bc03..65fb736f 100644 --- a/man/pub_covidcast.Rd +++ b/man/pub_covidcast.Rd @@ -2,15 +2,15 @@ % Please edit documentation in R/endpoints.R \name{pub_covidcast} \alias{pub_covidcast} -\title{COVID data via the covidcast endpoint} +\title{Various COVID and flu signals via the COVIDcast endpoint} \usage{ pub_covidcast( source, signals, geo_type, time_type, - geo_values, - time_values, + geo_values = "*", + time_values = "*", ..., as_of = NULL, issues = NULL, @@ -35,7 +35,7 @@ pub_covidcast( all. (See: \url{https://cmu-delphi.github.io/delphi-epidata/api/covidcast_geography.html}.)} -\item{time_values}{\code{\link{timeset}}. Dates to fetch.} +\item{time_values}{\code{\link{timeset}}. Dates to fetch. Defaults to all ("*") dates.} \item{...}{not used for values, forces later arguments to bind by name} diff --git a/man/pub_delphi.Rd b/man/pub_delphi.Rd index 83658abf..fe278beb 100644 --- a/man/pub_delphi.Rd +++ b/man/pub_delphi.Rd @@ -2,14 +2,15 @@ % Please edit documentation in R/endpoints.R \name{pub_delphi} \alias{pub_delphi} -\title{Delphi's ILINet forecasts} +\title{Delphi's ILINet outpatient doctor visits forecasts} \usage{ pub_delphi(system, epiweek, fetch_args = fetch_args_list()) } \arguments{ \item{system}{character. System name to fetch.} -\item{epiweek}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweek}{\code{\link{timeset}}. Epiweek to fetch. Does not support multiple dates. +Make separate calls to fetch data for multiple epiweeks.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } diff --git a/man/pub_dengue_nowcast.Rd b/man/pub_dengue_nowcast.Rd index 8bfa5c37..e1c2573c 100644 --- a/man/pub_dengue_nowcast.Rd +++ b/man/pub_dengue_nowcast.Rd @@ -2,14 +2,14 @@ % Please edit documentation in R/endpoints.R \name{pub_dengue_nowcast} \alias{pub_dengue_nowcast} -\title{Delphi's PAHO Dengue nowcast} +\title{Delphi's PAHO dengue nowcasts (North and South America)} \usage{ -pub_dengue_nowcast(locations, epiweeks, fetch_args = fetch_args_list()) +pub_dengue_nowcast(locations, epiweeks = "*", fetch_args = fetch_args_list()) } \arguments{ \item{locations}{character. Locations to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } diff --git a/man/pub_ecdc_ili.Rd b/man/pub_ecdc_ili.Rd index 85e5f789..d71b5651 100644 --- a/man/pub_ecdc_ili.Rd +++ b/man/pub_ecdc_ili.Rd @@ -2,11 +2,11 @@ % Please edit documentation in R/endpoints.R \name{pub_ecdc_ili} \alias{pub_ecdc_ili} -\title{ECDC ILI data} +\title{ECDC ILI incidence (Europe)} \usage{ pub_ecdc_ili( regions, - epiweeks, + epiweeks = "*", ..., issues = NULL, lag = NULL, @@ -16,7 +16,7 @@ pub_ecdc_ili( \arguments{ \item{regions}{character. Regions to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{...}{not used for values, forces later arguments to bind by name} diff --git a/man/pub_flusurv.Rd b/man/pub_flusurv.Rd index 4936499f..e8fd5bb0 100644 --- a/man/pub_flusurv.Rd +++ b/man/pub_flusurv.Rd @@ -2,11 +2,11 @@ % Please edit documentation in R/endpoints.R \name{pub_flusurv} \alias{pub_flusurv} -\title{FluSurv hospitalization data} +\title{CDC FluSurv flu hospitalizations} \usage{ pub_flusurv( locations, - epiweeks, + epiweeks = "*", ..., issues = NULL, lag = NULL, @@ -16,7 +16,7 @@ pub_flusurv( \arguments{ \item{locations}{character. Character vector indicating location.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{...}{not used for values, forces later arguments to bind by name} @@ -34,7 +34,7 @@ the most recent issue is returned. Mutually exclusive with \code{issues}.} \description{ API docs: \url{https://cmu-delphi.github.io/delphi-epidata/api/flusurv.html}. -Obtain information on flu hospitalization rates from the Center of Disease +Obtain information on influenza hospitalization rates from the Center of Disease Control. See also \url{https://gis.cdc.gov/GRASP/Fluview/FluHospRates.html}. diff --git a/man/pub_fluview.Rd b/man/pub_fluview.Rd index 6dd15c31..61ba357a 100644 --- a/man/pub_fluview.Rd +++ b/man/pub_fluview.Rd @@ -2,11 +2,11 @@ % Please edit documentation in R/endpoints.R \name{pub_fluview} \alias{pub_fluview} -\title{FluView ILINet data} +\title{CDC FluView ILINet outpatient doctor visits} \usage{ pub_fluview( regions, - epiweeks, + epiweeks = "*", ..., issues = NULL, lag = NULL, @@ -21,7 +21,7 @@ on. Full list link below.} \item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch in the form \code{epirange(startweek, endweek)}, where startweek and endweek are of the form -YYYYWW (string or numeric).} +YYYYWW (string or numeric). Defaults to all ("*") dates.} \item{...}{not used for values, forces later arguments to bind by name} diff --git a/man/pub_fluview_clinical.Rd b/man/pub_fluview_clinical.Rd index 460179ac..a4017c76 100644 --- a/man/pub_fluview_clinical.Rd +++ b/man/pub_fluview_clinical.Rd @@ -2,11 +2,11 @@ % Please edit documentation in R/endpoints.R \name{pub_fluview_clinical} \alias{pub_fluview_clinical} -\title{FluView virological data from clinical labs} +\title{CDC FluView flu tests from clinical labs} \usage{ pub_fluview_clinical( regions, - epiweeks, + epiweeks = "*", ..., issues = NULL, lag = NULL, @@ -18,7 +18,7 @@ pub_fluview_clinical( \item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch in the form epirange(startweek,endweek), where startweek and endweek are of the form -YYYYWW (string or numeric).} +YYYYWW (string or numeric). Defaults to all ("*") dates.} \item{...}{not used for values, forces later arguments to bind by name} diff --git a/man/pub_fluview_meta.Rd b/man/pub_fluview_meta.Rd index 37816b84..ab0c0b1a 100644 --- a/man/pub_fluview_meta.Rd +++ b/man/pub_fluview_meta.Rd @@ -2,7 +2,7 @@ % Please edit documentation in R/endpoints.R \name{pub_fluview_meta} \alias{pub_fluview_meta} -\title{FluView metadata} +\title{Metadata for the FluView endpoint} \usage{ pub_fluview_meta(fetch_args = fetch_args_list()) } @@ -14,12 +14,14 @@ pub_fluview_meta(fetch_args = fetch_args_list()) } \description{ API docs: \url{https://cmu-delphi.github.io/delphi-epidata/api/fluview_meta.html} -Returns information about the fluview endpoint. } \examples{ \dontrun{ pub_fluview_meta() } +} +\seealso{ +\code{\link[=pub_fluview]{pub_fluview()}} } \keyword{endpoint} diff --git a/man/pub_gft.Rd b/man/pub_gft.Rd index 95d57239..c80d8d9a 100644 --- a/man/pub_gft.Rd +++ b/man/pub_gft.Rd @@ -2,14 +2,14 @@ % Please edit documentation in R/endpoints.R \name{pub_gft} \alias{pub_gft} -\title{Google Flu Trends data} +\title{Google Flu Trends flu search volume} \usage{ -pub_gft(locations, epiweeks, fetch_args = fetch_args_list()) +pub_gft(locations, epiweeks = "*", fetch_args = fetch_args_list()) } \arguments{ \item{locations}{character. Locations to fetch.} -\item{epiweeks}{\code{\link{timeset}} Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}} Epiweeks to fetch. Defaults to all ("*") dates.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } diff --git a/man/pub_kcdc_ili.Rd b/man/pub_kcdc_ili.Rd index f6107603..0c8b70f4 100644 --- a/man/pub_kcdc_ili.Rd +++ b/man/pub_kcdc_ili.Rd @@ -2,11 +2,11 @@ % Please edit documentation in R/endpoints.R \name{pub_kcdc_ili} \alias{pub_kcdc_ili} -\title{KCDC ILI data} +\title{KCDC ILI incidence (Korea)} \usage{ pub_kcdc_ili( regions, - epiweeks, + epiweeks = "*", ..., issues = NULL, lag = NULL, @@ -16,7 +16,7 @@ pub_kcdc_ili( \arguments{ \item{regions}{character. Regions to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{...}{not used for values, forces later arguments to bind by name} diff --git a/man/pub_meta.Rd b/man/pub_meta.Rd index 438c17fb..202d3cfa 100644 --- a/man/pub_meta.Rd +++ b/man/pub_meta.Rd @@ -2,7 +2,7 @@ % Please edit documentation in R/endpoints.R \name{pub_meta} \alias{pub_meta} -\title{API metadata} +\title{Metadata for the Delphi Epidata API} \usage{ pub_meta(fetch_args = fetch_args_list()) } diff --git a/man/pub_nidss_dengue.Rd b/man/pub_nidss_dengue.Rd index b5e2aa90..67be9c94 100644 --- a/man/pub_nidss_dengue.Rd +++ b/man/pub_nidss_dengue.Rd @@ -2,14 +2,14 @@ % Please edit documentation in R/endpoints.R \name{pub_nidss_dengue} \alias{pub_nidss_dengue} -\title{NIDSS dengue data} +\title{NIDSS dengue cases (Taiwan)} \usage{ -pub_nidss_dengue(locations, epiweeks, fetch_args = fetch_args_list()) +pub_nidss_dengue(locations, epiweeks = "*", fetch_args = fetch_args_list()) } \arguments{ \item{locations}{character. Locations to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } diff --git a/man/pub_nidss_flu.Rd b/man/pub_nidss_flu.Rd index 480b288c..946a1b87 100644 --- a/man/pub_nidss_flu.Rd +++ b/man/pub_nidss_flu.Rd @@ -2,11 +2,11 @@ % Please edit documentation in R/endpoints.R \name{pub_nidss_flu} \alias{pub_nidss_flu} -\title{NIDSS flu data} +\title{NIDSS flu doctor visits (Taiwan)} \usage{ pub_nidss_flu( regions, - epiweeks, + epiweeks = "*", ..., issues = NULL, lag = NULL, @@ -16,7 +16,7 @@ pub_nidss_flu( \arguments{ \item{regions}{character. Regions to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{...}{not used for values, forces later arguments to bind by name} diff --git a/man/pub_nowcast.Rd b/man/pub_nowcast.Rd index 508d4fc1..306c37f1 100644 --- a/man/pub_nowcast.Rd +++ b/man/pub_nowcast.Rd @@ -2,14 +2,14 @@ % Please edit documentation in R/endpoints.R \name{pub_nowcast} \alias{pub_nowcast} -\title{Delphi's ILI nowcast} +\title{Delphi's ILI Nearby nowcasts} \usage{ -pub_nowcast(locations, epiweeks, fetch_args = fetch_args_list()) +pub_nowcast(locations, epiweeks = "*", fetch_args = fetch_args_list()) } \arguments{ \item{locations}{character. Locations to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } diff --git a/man/pub_paho_dengue.Rd b/man/pub_paho_dengue.Rd index e99fbc5f..0d643f44 100644 --- a/man/pub_paho_dengue.Rd +++ b/man/pub_paho_dengue.Rd @@ -2,11 +2,11 @@ % Please edit documentation in R/endpoints.R \name{pub_paho_dengue} \alias{pub_paho_dengue} -\title{PAHO Dengue data} +\title{PAHO dengue data (North and South America)} \usage{ pub_paho_dengue( regions, - epiweeks, + epiweeks = "*", ..., issues = NULL, lag = NULL, @@ -16,7 +16,7 @@ pub_paho_dengue( \arguments{ \item{regions}{character. Regions to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{...}{not used for values, forces later arguments to bind by name} diff --git a/man/pub_wiki.Rd b/man/pub_wiki.Rd index cde73d95..278dca58 100644 --- a/man/pub_wiki.Rd +++ b/man/pub_wiki.Rd @@ -2,13 +2,13 @@ % Please edit documentation in R/endpoints.R \name{pub_wiki} \alias{pub_wiki} -\title{Wikipedia access data} +\title{Wikipedia webpage counts by article} \usage{ pub_wiki( articles, ..., - dates = NULL, - epiweeks = NULL, + time_type = c("day", "week"), + time_values = "*", hours = NULL, language = "en", fetch_args = fetch_args_list() @@ -19,10 +19,11 @@ pub_wiki( \item{...}{not used for values, forces later arguments to bind by name} -\item{dates}{\code{\link{timeset}}. Dates to fetch. Mutually exclusive with \code{epiweeks}.} +\item{time_type}{string. The temporal resolution of the data (either "day" or +"week", depending on signal).} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Mutually exclusive with -\code{dates}.} +\item{time_values}{\code{\link{timeset}}. Dates or epiweeks to fetch. Defaults to all +("*") dates.} \item{hours}{integer. Optionally, the hours to fetch.} @@ -46,7 +47,11 @@ Number of page visits for selected English, Influenza-related wikipedia articles } \examples{ \dontrun{ -pub_wiki(articles = "avian_influenza", epiweeks = epirange(201501, 201601)) +pub_wiki( + articles = "avian_influenza", + time_type = "week", + time_values = epirange(201501, 201601) +) } } \keyword{endpoint} diff --git a/man/pvt_cdc.Rd b/man/pvt_cdc.Rd index 744ee76e..35cc555b 100644 --- a/man/pvt_cdc.Rd +++ b/man/pvt_cdc.Rd @@ -2,16 +2,16 @@ % Please edit documentation in R/endpoints.R \name{pvt_cdc} \alias{pvt_cdc} -\title{CDC page hits} +\title{CDC total and by topic webpage visits} \usage{ -pvt_cdc(auth, locations, epiweeks, fetch_args = fetch_args_list()) +pvt_cdc(auth, locations, epiweeks = "*", fetch_args = fetch_args_list()) } \arguments{ \item{auth}{string. Restricted access key (not the same as API key).} \item{locations}{character. Locations to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}. See \code{fetch_args_list()} for details.} diff --git a/man/pvt_dengue_sensors.Rd b/man/pvt_dengue_sensors.Rd index 47f50eaa..2ff7eb30 100644 --- a/man/pvt_dengue_sensors.Rd +++ b/man/pvt_dengue_sensors.Rd @@ -2,13 +2,13 @@ % Please edit documentation in R/endpoints.R \name{pvt_dengue_sensors} \alias{pvt_dengue_sensors} -\title{Dengue digital surveillance sensors in PAHO member countries} +\title{PAHO dengue digital surveillance sensors (North and South America)} \usage{ pvt_dengue_sensors( auth, names, locations, - epiweeks, + epiweeks = "*", fetch_args = fetch_args_list() ) } @@ -19,7 +19,7 @@ pvt_dengue_sensors( \item{locations}{character. Locations to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } diff --git a/man/pvt_ght.Rd b/man/pvt_ght.Rd index 3366416f..7a16f10c 100644 --- a/man/pvt_ght.Rd +++ b/man/pvt_ght.Rd @@ -2,16 +2,16 @@ % Please edit documentation in R/endpoints.R \name{pvt_ght} \alias{pvt_ght} -\title{Google Health Trends data} +\title{Google Health Trends health topics search volume} \usage{ -pvt_ght(auth, locations, epiweeks, query, fetch_args = fetch_args_list()) +pvt_ght(auth, locations, epiweeks = "*", query, fetch_args = fetch_args_list()) } \arguments{ \item{auth}{string. Restricted access key (not the same as API key).} \item{locations}{character. Locations to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{query}{string. The query to be fetched.} diff --git a/man/pvt_meta_norostat.Rd b/man/pvt_meta_norostat.Rd index e967e316..491c7218 100644 --- a/man/pvt_meta_norostat.Rd +++ b/man/pvt_meta_norostat.Rd @@ -2,7 +2,7 @@ % Please edit documentation in R/endpoints.R \name{pvt_meta_norostat} \alias{pvt_meta_norostat} -\title{NoroSTAT metadata} +\title{Metadata for the NoroSTAT endpoint} \usage{ pvt_meta_norostat(auth, fetch_args = fetch_args_list()) } @@ -22,4 +22,7 @@ API docs: \url{https://cmu-delphi.github.io/delphi-epidata/api/meta_norostat.htm pvt_meta_norostat(auth = Sys.getenv("SECRET_API_AUTH_NOROSTAT")) } } +\seealso{ +\code{\link[=pvt_norostat]{pvt_norostat()}} +} \keyword{endpoint} diff --git a/man/pvt_norostat.Rd b/man/pvt_norostat.Rd index 60808134..24ffd778 100644 --- a/man/pvt_norostat.Rd +++ b/man/pvt_norostat.Rd @@ -2,16 +2,16 @@ % Please edit documentation in R/endpoints.R \name{pvt_norostat} \alias{pvt_norostat} -\title{NoroSTAT data (point data, no min/max)} +\title{CDC NoroSTAT norovirus outbreaks} \usage{ -pvt_norostat(auth, locations, epiweeks, fetch_args = fetch_args_list()) +pvt_norostat(auth, locations, epiweeks = "*", fetch_args = fetch_args_list()) } \arguments{ \item{auth}{string. Your authentication key.} \item{locations}{character. Locations to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } @@ -19,10 +19,12 @@ pvt_norostat(auth, locations, epiweeks, fetch_args = fetch_args_list()) \code{\link[tibble:tibble]{tibble::tibble}} } \description{ +This is point data only, and does not include minima or maxima. + API docs: \url{https://cmu-delphi.github.io/delphi-epidata/api/norostat.html} -This is the documentation of the API for accessing the NoroSTAT (norostat) -endpoint of the Delphi’s epidemiological data. +This is the documentation of the API for accessing the NoroSTAT endpoint of +the Delphi’s epidemiological data. } \examples{ \dontrun{ diff --git a/man/pvt_quidel.Rd b/man/pvt_quidel.Rd index 909df751..10ca3c0a 100644 --- a/man/pvt_quidel.Rd +++ b/man/pvt_quidel.Rd @@ -4,14 +4,14 @@ \alias{pvt_quidel} \title{Quidel COVID-19 and influenza testing data} \usage{ -pvt_quidel(auth, locations, epiweeks, fetch_args = fetch_args_list()) +pvt_quidel(auth, locations, epiweeks = "*", fetch_args = fetch_args_list()) } \arguments{ \item{auth}{string. Restricted access key (not the same as API key).} \item{locations}{character. Locations to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } diff --git a/man/pvt_sensors.Rd b/man/pvt_sensors.Rd index 0d88e2dd..35e41bf0 100644 --- a/man/pvt_sensors.Rd +++ b/man/pvt_sensors.Rd @@ -2,9 +2,15 @@ % Please edit documentation in R/endpoints.R \name{pvt_sensors} \alias{pvt_sensors} -\title{Digital surveillance sensors} +\title{Influenza and dengue digital surveillance sensors} \usage{ -pvt_sensors(auth, names, locations, epiweeks, fetch_args = fetch_args_list()) +pvt_sensors( + auth, + names, + locations, + epiweeks = "*", + fetch_args = fetch_args_list() +) } \arguments{ \item{auth}{string. Restricted access key (not the same as API key).} @@ -13,7 +19,7 @@ pvt_sensors(auth, names, locations, epiweeks, fetch_args = fetch_args_list()) \item{locations}{character. Locations to fetch.} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch.} +\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Defaults to all ("*") dates.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } @@ -24,7 +30,7 @@ pvt_sensors(auth, names, locations, epiweeks, fetch_args = fetch_args_list()) API docs: \url{https://cmu-delphi.github.io/delphi-epidata/api/sensors.html} This is the documentation of the API for accessing the Digital Surveillance -Sensors (sensors) endpoint of the Delphi’s epidemiological Note: this +Sensors endpoint of the Delphi’s epidemiological. Note: this repository was built to support modeling and forecasting efforts surrounding seasonal influenza (and dengue). In the current COVID-19 pandemic, syndromic surveillance data, like ILI data (influenza-like diff --git a/man/pvt_twitter.Rd b/man/pvt_twitter.Rd index 92ee2c39..b6c6e95f 100644 --- a/man/pvt_twitter.Rd +++ b/man/pvt_twitter.Rd @@ -2,14 +2,14 @@ % Please edit documentation in R/endpoints.R \name{pvt_twitter} \alias{pvt_twitter} -\title{HealthTweets data} +\title{HealthTweets total and influenza-related tweets} \usage{ pvt_twitter( auth, locations, ..., - dates = NULL, - epiweeks = NULL, + time_type = c("day", "week"), + time_values = "*", fetch_args = fetch_args_list() ) } @@ -20,10 +20,11 @@ pvt_twitter( \item{...}{not used for values, forces later arguments to bind by name} -\item{dates}{\code{\link{timeset}}. Dates to fetch. Mutually exclusive with \code{epiweeks}.} +\item{time_type}{string. The temporal resolution of the data (either "day" or +"week", depending on signal).} -\item{epiweeks}{\code{\link{timeset}}. Epiweeks to fetch. Mutually exclusive with -\code{dates}.} +\item{time_values}{\code{\link{timeset}}. Dates or epiweeks to fetch. Defaults to all +("*") dates.} \item{fetch_args}{\code{\link{fetch_args}}. Additional arguments to pass to \code{fetch()}.} } @@ -33,15 +34,17 @@ pvt_twitter( \description{ API docs: \url{https://cmu-delphi.github.io/delphi-epidata/api/twitter.html} -This is the API documentation for accessing the Twitter Stream (twitter) endpoint of Delphi’s epidemiological data. -Sourced from \href{http://www.healthtweets.org/}{Healthtweets} +This is the API documentation for accessing the Twitter Stream endpoint of +Delphi’s epidemiological data. Sourced from +\href{http://www.healthtweets.org/}{Healthtweets} } \examples{ \dontrun{ pvt_twitter( auth = Sys.getenv("SECRET_API_AUTH_TWITTER"), locations = "CA", - epiweeks = epirange(201501, 202001) + time_type = "week", + time_values = epirange(201501, 202001) ) } } diff --git a/man/reformat_epirange.Rd b/man/reformat_epirange.Rd new file mode 100644 index 00000000..5341c521 --- /dev/null +++ b/man/reformat_epirange.Rd @@ -0,0 +1,12 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/model.R +\name{reformat_epirange} +\alias{reformat_epirange} +\title{helper to convert an epirange from week to day or vice versa} +\usage{ +reformat_epirange(epirange, to_type = c("day", "week")) +} +\description{ +helper to convert an epirange from week to day or vice versa +} +\keyword{internal} diff --git a/man/release_bullets.Rd b/man/release_bullets.Rd new file mode 100644 index 00000000..64e1341b --- /dev/null +++ b/man/release_bullets.Rd @@ -0,0 +1,12 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/utils.R +\name{release_bullets} +\alias{release_bullets} +\title{inserts each string as a bullet at the end of the "Prepare for release" section} +\usage{ +release_bullets() +} +\description{ +inserts each string as a bullet at the end of the "Prepare for release" section +} +\keyword{internal} diff --git a/man/request_impl.Rd b/man/request_impl.Rd index 476c7ee2..d6ad7669 100644 --- a/man/request_impl.Rd +++ b/man/request_impl.Rd @@ -5,7 +5,7 @@ \title{Makes a request to the API and returns the response, catching HTTP errors and forwarding the HTTP body in R errors} \usage{ -request_impl(epidata_call, format_type, fields = NULL, timeout_seconds = 30) +request_impl(epidata_call, format_type, timeout_seconds, fields) } \description{ Makes a request to the API and returns the response, catching diff --git a/man/set_cache.Rd b/man/set_cache.Rd index 87c147f0..6787edf0 100644 --- a/man/set_cache.Rd +++ b/man/set_cache.Rd @@ -9,14 +9,15 @@ set_cache( days = NULL, max_size = NULL, logfile = NULL, - confirm = TRUE + confirm = TRUE, + startup = FALSE ) } \arguments{ \item{cache_dir}{the directory in which the cache is stored. By default, this -is \code{tools::R_user_dir()} if on R 4.0+, but must be specified for earlier -versions of R. The path can be either relative or absolute. The -environmental variable is \code{EPIDATR_CACHE_DIR}.} +is \code{rappdirs::user_cache_dir("R", version = "epidatr")}. The path can be +either relative or absolute. The environmental variable is +\code{EPIDATR_CACHE_DIR}.} \item{days}{the maximum length of time in days to keep any particular cached call. By default this is \code{1}. The environmental variable is @@ -32,6 +33,9 @@ variable is \code{EPIDATR_CACHE_LOGFILE}.} \item{confirm}{whether to confirm directory creation. default is \code{TRUE}; should only be set in non-interactive scripts} + +\item{startup}{indicates whether the function is being called on +startup. Affects suppressability of the messages. Default is \code{FALSE}.} } \value{ \code{\link{NULL}} no return value, all effects are stored in the package @@ -64,7 +68,7 @@ An important feature of the caching in this package is that only calls which specify either \code{issues} before a certain date, or \code{as_of} before a certain date will actually cache. For example the call -\if{html}{\out{
}}\preformatted{covidcast( +\if{html}{\out{
}}\preformatted{pub_covidcast( source = "jhu-csse", signals = "confirmed_7dav_incidence_prop", geo_type = "state", @@ -77,7 +81,7 @@ date will actually cache. For example the call \emph{won't} cache, since it is possible for the cache to be invalidated by new releases with no warning. On the other hand, the call -\if{html}{\out{
}}\preformatted{covidcast( +\if{html}{\out{
}}\preformatted{pub_covidcast( source = "jhu-csse", signals = "confirmed_7dav_incidence_prop", geo_type = "state", diff --git a/man/timeset.Rd b/man/timeset.Rd index 5d49151d..6dcdc2b8 100644 --- a/man/timeset.Rd +++ b/man/timeset.Rd @@ -2,26 +2,26 @@ % Please edit documentation in R/model.R \name{timeset} \alias{timeset} -\title{Timeset} +\title{Timeset formats for specifying dates} \description{ Many API calls accept timesets to specify the time ranges of data being requested. Timesets can be specified with \code{epirange()}, as \code{Date} objects, or with wildcards. - -Timesets are not special R types; the term simply describes any value that -would be accepted by epidatr to specify the time value of an epidata query. -The allowed values are: +} +\details{ +Timesets are not special R types; the term simply describes any value that is +accepted by epidatr to specify the time value of an epidata query: \itemize{ -\item Dates: \code{Date} instances, integer-like values, or integer-like strings that -take the form YYYYMMDD. -\item Epiweeks: Integer-like values or integer-like strings that take the form -YYYYWW. +\item Dates: \code{Date} instances. +\item Date strings or integers: Strings or integers in the format YYYYMMDD. +\item Epiweeks: Strings or integers in the format YYYYWW, where WW is the epiweek +number. \item EpiRanges: A range returned by \code{epirange()}, or a list of multiple ranges. -\item Wildcard: The string \code{"*"}, which request all available time values. +\item Wildcard: The string \code{"*"}, which requests all available time values. } -Please refer to the specific endpoint documentation for guidance on using -dates vs weeks. Most endpoints support only one or the other. Some (less -commonly used) endpoints may not accept the \code{"*"} wildcard, but this can be -simulated with a large \code{epirange()}. +Refer to the specific endpoint documentation for guidance on using dates vs +weeks. Most endpoints support only one or the other. Some (less commonly +used) endpoints may not accept the \code{"*"} wildcard, but this can be simulated +with a large \code{epirange()}. } diff --git a/tests/testthat/generate_test_data.R b/tests/testthat/generate_test_data.R index 95032fba..834de416 100644 --- a/tests/testthat/generate_test_data.R +++ b/tests/testthat/generate_test_data.R @@ -4,7 +4,8 @@ epidata_call %>% url <- full_url(epidata_call) params <- request_arguments(epidata_call, "csv", NULL) -result <- do_request(url, params) %>% readr::write_rds(testthat::test_path("data/test-http401.rds")) +result <- do_request(url, params, timeout_seconds = 10 * 60) %>% + readr::write_rds(testthat::test_path("data/test-http401.rds")) epidata_call <- pvt_afhsb( auth = Sys.getenv("SECRET_API_AUTH_AFHSB"), @@ -14,7 +15,8 @@ epidata_call <- pvt_afhsb( ) url <- full_url(epidata_call) params <- request_arguments(epidata_call, "csv", NULL) -response <- do_request(url, params) %>% readr::write_rds(testthat::test_path("data/test-http500.rds")) +response <- do_request(url, params, timeout_seconds = 10 * 60) %>% + readr::write_rds(testthat::test_path("data/test-http500.rds")) epidata_call %>% fetch_debug(format_type = "classic") %>% @@ -33,5 +35,5 @@ response <- httr::RETRY("GET", query = list(), terminate_on = c(400, 401, 403, 405, 414, 500), http_headers, - httr::authenticate("epidata", get_auth_key()) + httr::authenticate("epidata", get_api_key()) ) %>% readr::write_rds(testthat::test_path("data/test-do_request-httpbin.rds")) diff --git a/tests/testthat/test-auth.R b/tests/testthat/test-auth.R index 3aa07cd3..660b18e7 100644 --- a/tests/testthat/test-auth.R +++ b/tests/testthat/test-auth.R @@ -1,15 +1,5 @@ -test_that("get_auth_key", { +test_that("get_api_key", { withr::with_envvar(c(DELPHI_EPIDATA_KEY = "epidata_key_from_envvar"), { - withr::with_options(list(delphi.epidata.key = "epidata_key_from_options"), { - # envvar takes precedence over option (characterization test; we don't - # guarantee this in docs): - expect_identical(get_auth_key(), "epidata_key_from_envvar") - }) - }) - withr::with_envvar(c(DELPHI_EPIDATA_KEY = NA_character_), { - withr::with_options(list(delphi.epidata.key = "epidata_key_from_options"), { - # option by itself works: - expect_identical(get_auth_key(), "epidata_key_from_options") - }) + expect_identical(get_api_key(), "epidata_key_from_envvar") }) }) diff --git a/tests/testthat/test-endpoints.R b/tests/testthat/test-endpoints.R index 3c81dea1..39194535 100644 --- a/tests/testthat/test-endpoints.R +++ b/tests/testthat/test-endpoints.R @@ -37,14 +37,14 @@ test_that("basic_epidata_call", { fetch_args = fetch_args_list(dry_run = TRUE) ) %>% request_url()) expect_no_error(pub_dengue_nowcast( - locations = "?", + locations = "ca", epiweeks = epirange(201501, 202001), fetch_args = fetch_args_list(dry_run = TRUE) ) %>% request_url()) expect_no_error(pvt_dengue_sensors( auth = "yourkey", - names = "?", - locations = "?", + names = "ght", + locations = "ag", epiweeks = epirange(201501, 202001), fetch_args = fetch_args_list(dry_run = TRUE) ) %>% request_url()) @@ -80,11 +80,11 @@ test_that("basic_epidata_call", { auth = "yourkey", locations = "ca", epiweeks = epirange(201201, 202001), - query = "?", + query = "how to get over the flu", fetch_args = fetch_args_list(dry_run = TRUE) ) %>% request_url()) expect_no_error(pub_kcdc_ili( - regions = "?", + regions = "ROK", epiweeks = epirange(201201, 202001), fetch_args = fetch_args_list(dry_run = TRUE) ) %>% request_url()) @@ -137,12 +137,383 @@ test_that("basic_epidata_call", { expect_no_error(pvt_twitter( auth = "yourkey", locations = "CA", - epiweeks = epirange(201501, 202001), + time_type = "week", + time_values = epirange(201501, 202001), + fetch_args = fetch_args_list(dry_run = TRUE) + ) %>% request_url()) + expect_no_error(pvt_twitter( + auth = "yourkey", + locations = "CA", + time_type = "day", + time_values = epirange(20150101, 20200101), fetch_args = fetch_args_list(dry_run = TRUE) ) %>% request_url()) expect_no_error(pub_wiki( articles = "avian_influenza", - epiweeks = epirange(201501, 202001), + time_type = "week", + time_values = epirange(201501, 202001), + fetch_args = fetch_args_list(dry_run = TRUE) + ) %>% request_url()) + expect_no_error(pub_wiki( + articles = "avian_influenza", + time_type = "day", + time_values = epirange(20150101, 20200101), fetch_args = fetch_args_list(dry_run = TRUE) ) %>% request_url()) }) + +test_that("endoints accept wildcard for date parameter", { + expect_no_error(call <- pvt_cdc( + auth = "yourkey", + "fl,ca", + "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_covid_hosp_facility( + hospital_pks = "100075", + collection_weeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$collection_weeks$from, 10000101) + expect_identical(call$params$collection_weeks$to, 30000101) + + expect_no_error(call <- pub_covid_hosp_state_timeseries( + states = "fl", + dates = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$dates$from, 10000101) + expect_identical(call$params$dates$to, 30000101) + + expect_no_error(call <- pub_covidcast( + source = "jhu-csse", + signals = "confirmed_7dav_incidence_prop", + time_type = "day", + geo_type = "state", + time_values = "*", + geo_values = "ca,fl", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$time_values, "*") + + expect_no_error(call <- pub_dengue_nowcast( + locations = "ca", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pvt_dengue_sensors( + auth = "yourkey", + names = "ght", + locations = "ag", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_ecdc_ili( + regions = "austria", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_flusurv( + locations = "CA", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_fluview_clinical( + regions = "nat", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_fluview( + regions = "nat", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_gft( + locations = "hhs1", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pvt_ght( + auth = "yourkey", + locations = "ca", + epiweeks = "*", + query = "how to get over the flu", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_kcdc_ili( + regions = "ROK", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_nidss_dengue( + locations = "taipei", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_nidss_flu( + regions = "taipei", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pvt_norostat( + auth = "yourkey", + locations = "Minnesota, Ohio, Oregon, Tennessee, and Wisconsin", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_nowcast( + locations = "ca", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_paho_dengue( + regions = "ca", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pvt_quidel( + auth = "yourkey", + locations = "hhs1", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pvt_sensors( + auth = "yourkey", + names = "sar3", + locations = "nat", + epiweeks = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pvt_twitter( + auth = "yourkey", + locations = "CA", + time_type = "week", + time_values = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pvt_twitter( + auth = "yourkey", + locations = "CA", + time_type = "day", + time_values = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$dates$from, 10000101) + expect_identical(call$params$dates$to, 30000101) + + expect_no_error(call <- pub_wiki( + articles = "avian_influenza", + time_type = "week", + time_values = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$epiweeks$from, 100001) + expect_identical(call$params$epiweeks$to, 300001) + + expect_no_error(call <- pub_wiki( + articles = "avian_influenza", + time_type = "day", + time_values = "*", + fetch_args = fetch_args_list(dry_run = TRUE) + )) + expect_identical(call$params$dates$from, 10000101) + expect_identical(call$params$dates$to, 30000101) +}) + +test_that("endpoints fail when given args via dots", { + dots_error <- "`...` must be empty" + + # time value/epiweek arg is passed erroneously as `date_range` + expect_error( + pub_covid_hosp_facility_lookup( + state = "fl", + date_range = 20200101 + ), + regexp = dots_error + ) + expect_error( + pub_covid_hosp_facility( + hospital_pks = "100075", + date_range = epirange(20200101, 20200501) + ), + regexp = dots_error + ) + expect_error( + pub_covid_hosp_state_timeseries( + states = "fl", + date_range = epirange(20200101, 20200501) + ), + regexp = dots_error + ) + expect_error( + pub_covidcast( + source = "jhu-csse", + signals = "confirmed_7dav_incidence_prop", + time_type = "day", + geo_type = "state", + date_range = epirange(20200601, 20200801), + geo_values = "ca,fl" + ), + regexp = dots_error + ) + expect_error( + pub_ecdc_ili( + regions = "austria", + date_range = epirange(201201, 202001) + ), + regexp = dots_error + ) + expect_error( + pub_flusurv( + locations = "CA", + date_range = epirange(201201, 202001) + ), + regexp = dots_error + ) + expect_error( + pub_fluview_clinical( + regions = "nat", + date_range = epirange(201601, 201701) + ), + regexp = dots_error + ) + expect_error( + pub_fluview( + regions = "nat", + date_range = epirange(201601, 201701) + ), + regexp = dots_error + ) + expect_error( + pub_kcdc_ili( + regions = "ROK", + date_range = epirange(201201, 202001) + ), + regexp = dots_error + ) + expect_error( + pub_nidss_flu( + regions = "taipei", + date_range = epirange(201201, 202001) + ), + regexp = dots_error + ) + expect_error( + pub_paho_dengue( + regions = "ca", + date_range = epirange(201201, 202001) + ), + regexp = dots_error + ) + expect_error( + pvt_twitter( + auth = "yourkey", + locations = "CA", + time_type = "week", + time_range = epirange(201501, 202001) + ), + regexp = dots_error + ) + expect_error( + pub_wiki( + articles = "avian_influenza", + time_type = "week", + date_range = epirange(201501, 202001) + ), + regexp = dots_error + ) +}) + +test_that("pub_covid_hosp_state_timeseries supports versioned queries", { + epidata_call <- pub_covid_hosp_state_timeseries( + "ut", epirange(12340101, 34560101), + issues = 20220101, + fetch_args = fetch_args_list( + fields = c( + "state", "geocoded_state", "date", "issue", + "previous_day_admission_influenza_confirmed", + "previous_day_admission_influenza_confirmed_coverage" + ), + disable_date_parsing = TRUE, + dry_run = TRUE + ) + ) + expect_identical(epidata_call$params$issues, 20220101) + expect_identical(epidata_call$params$as_of, NULL) + # COVID hosp state timeseries server code doesn't support `lag` + expect_identical(epidata_call$params$lag, NULL) + + epidata_call <- pub_covid_hosp_state_timeseries( + "ut", epirange(12340101, 34560101), + as_of = 20220101, + fetch_args = fetch_args_list( + fields = c( + "state", "geocoded_state", "date", "issue", + "previous_day_admission_influenza_confirmed", + "previous_day_admission_influenza_confirmed_coverage" + ), + disable_date_parsing = TRUE, + dry_run = TRUE + ) + ) + expect_identical(epidata_call$params$issues, NULL) + expect_identical(epidata_call$params$as_of, 20220101) + expect_identical(epidata_call$params$lag, NULL) +}) diff --git a/tests/testthat/test-epidatacall.R b/tests/testthat/test-epidatacall.R index b0d171d8..028ba1f4 100644 --- a/tests/testthat/test-epidatacall.R +++ b/tests/testthat/test-epidatacall.R @@ -10,7 +10,11 @@ test_that("request_impl http errors", { # see generate_test_data.R do_request = function(...) readRDS(testthat::test_path("data/test-http401.rds")), ) - expect_error(response <- epidata_call %>% request_impl("csv"), class = "http_401") + expect_error( + response <- epidata_call %>% + request_impl("csv", timeout_seconds = 30, fields = NULL), + class = "http_401" + ) # should give a 500 error (the afhsb endpoint is removed) @@ -18,7 +22,11 @@ test_that("request_impl http errors", { local_mocked_bindings( do_request = function(...) readRDS(testthat::test_path("data/test-http500.rds")) ) - expect_error(response <- epidata_call %>% request_impl("csv"), class = "http_500") + expect_error( + response <- epidata_call %>% + request_impl("csv", timeout_seconds = 30, fields = NULL), + class = "http_500" + ) }) test_that("fetch_args", { @@ -30,7 +38,7 @@ test_that("fetch_args", { disable_date_parsing = FALSE, disable_data_frame_parsing = FALSE, return_empty = FALSE, - timeout_seconds = 30, + timeout_seconds = 15 * 60, base_url = NULL, dry_run = FALSE, debug = FALSE, @@ -160,3 +168,53 @@ test_that("classic only fetch", { # making sure that fetch_tbl and throws the expected error on classic only expect_error(epidata_call %>% fetch_tbl(), class = "only_supports_classic_format") }) + +test_that("create_epidata_call basic behavior", { + endpoint <- "endpoint" + params <- list() + + # Success + meta <- list( + create_epidata_field_info("time_value", "date"), + create_epidata_field_info("value", "float") + ) + expected <- list( + endpoint = endpoint, + params = params, + base_url = "https://api.delphi.cmu.edu/epidata/", + meta = meta, + only_supports_classic = FALSE + ) + class(expected) <- "epidata_call" + expect_identical(create_epidata_call(endpoint, params, meta = meta), expected) + + expected$meta <- list() + expect_identical(create_epidata_call(endpoint, params, meta = NULL), expected) + expect_identical(create_epidata_call(endpoint, params, meta = list()), expected) +}) + + +test_that("create_epidata_call fails when meta arg contains duplicates", { + endpoint <- "endpoint" + params <- list() + + # Duplicate names + meta <- list( + create_epidata_field_info("time_value", "date"), + create_epidata_field_info("time_value", "int") + ) + expect_error( + create_epidata_call(endpoint, params, meta = meta), + class = "epidatr__duplicate_meta_names" + ) + + # Duplicate entries + meta <- list( + create_epidata_field_info("time_value", "date"), + create_epidata_field_info("time_value", "date") + ) + expect_error( + create_epidata_call(endpoint, params, meta = meta), + class = "epidatr__duplicate_meta_entries" + ) +}) diff --git a/tests/testthat/test-model.R b/tests/testthat/test-model.R index 7a05aa0e..5444eb5e 100644 --- a/tests/testthat/test-model.R +++ b/tests/testthat/test-model.R @@ -57,11 +57,12 @@ test_that("null parsing", { # see generate_test_data.R mock_df <- as.data.frame(readr::read_rds(testthat::test_path("data/flusurv-epiweeks.rds"))) metadata <- epidata_call$meta - mock_df[[metadata[[1]]$name]][1] <- list(NULL) + mock_df[[metadata[[1]]$name]][1] <- NA mock_df[[metadata[[2]]$name]] <- c(TRUE) epidata_call$meta[[2]]$type <- "bool" - res <- parse_data_frame(epidata_call, mock_df) %>% as_tibble() + expect_no_error(res <- parse_data_frame(epidata_call, mock_df) %>% as_tibble()) expect_true(res$location) + expect_identical(res$release_date, as.Date(NA)) # if the call has no metadata, return the whole frame as is epidata_call$meta <- NULL @@ -69,7 +70,124 @@ test_that("null parsing", { }) test_that("parse invalid time", { - vale <- list(3) - vale$class <- "my nonexistant class" - expect_error(parse_timeset_input(vale)) + value <- list(3) + value$class <- "my nonexistant class" + expect_error(parse_timeset_input(value)) +}) + +test_that("parse_data_frame warns when df contains fields not listed in meta", { + epidata_call <- pub_flusurv( + locations = "ca", + epiweeks = 202001, + fetch_args = fetch_args_list(dry_run = TRUE) + ) + # see generate_test_data.R + mock_df <- as.data.frame(readr::read_rds(testthat::test_path("data/flusurv-epiweeks.rds"))) + + # Success when meta and df fields match exactly + expect_no_warning(parse_data_frame(epidata_call, mock_df)) + + # Warning when df contains extra fields + mock_df$extra <- 5 + expect_warning( + parse_data_frame(epidata_call, mock_df), + class = "epidatr__missing_meta_fields" + ) + mock_df$extra <- NULL + + # Success when meta contains extra fields + mock_df$rate_age_0 <- NULL + expect_no_warning(parse_data_frame(epidata_call, mock_df)) +}) + +test_that("parse_data_frame warns when df contains int values with decimal component", { + epidata_call <- pub_flusurv( + locations = "ca", + epiweeks = 202001, + fetch_args = fetch_args_list(dry_run = TRUE) + ) + # see generate_test_data.R + mock_df <- as.data.frame(readr::read_rds(testthat::test_path("data/flusurv-epiweeks.rds"))) + + # Int fields are returned as double + result <- parse_data_frame(epidata_call, mock_df) + expect_type(result$lag, "double") + + # Replace int fields with decimal + mock_df$lag <- 4.3 + + # Warning when int values have a decimal component + expect_warning( + parse_data_frame(epidata_call, mock_df), + class = "epidatr__int_nonzero_decimal_digits" + ) +}) + +test_that("parse_value can handle NA/NULL values in an int field", { + info <- create_epidata_field_info( + name = "test", + type = "int" + ) + expect_warning( + parse_value(info, c(1, 1.5, NA, NULL)), + class = "epidatr__int_nonzero_decimal_digits" + ) +}) + +test_that("parse_api_date accepts str and int input", { + expect_identical(parse_api_date("20200101"), as.Date("2020-01-01")) + expect_identical(parse_api_date(20200101), as.Date("2020-01-01")) +}) + +test_that("parse_api_date accepts YYYYMMDD and YYYY-MM-DD", { + expect_identical(parse_api_date(20200101), as.Date("2020-01-01")) + expect_identical(parse_api_date("2020-01-01"), as.Date("2020-01-01")) +}) + +test_that("parse_api_date handles missing values appropriately", { + expect_identical(parse_api_date(NA), as.Date(NA)) +}) + +test_that("date_to_epiweek accepts str and int input", { + expect_identical(date_to_epiweek("20200101"), 202001) + expect_identical(date_to_epiweek(20200101), 202001) +}) + +test_that("date_to_epiweek accepts single and double-digit weeks", { + expect_identical(date_to_epiweek(20201101), 202045) + expect_identical(date_to_epiweek(20200109), 202002) +}) + +test_that("reformat_epirange works in basic cases", { + # Week to week + result <- reformat_epirange(epirange(202002, 202013), "week") + expect_identical(result, epirange(202002, 202013)) + + result <- reformat_epirange(epirange("202002", "202013"), "week") + expect_identical(result, epirange("202002", "202013")) + + # Week to day + # Across year boundary + result <- reformat_epirange(epirange(202001, 202013), "day") + expect_identical(result, epirange(20191229, 20200322)) + + result <- reformat_epirange(epirange(202002, 202013), "day") + expect_identical(result, epirange(20200105, 20200322)) + + result <- reformat_epirange(epirange("202002", "202013"), "day") + expect_identical(result, epirange(20200105, 20200322)) + + # Day to week + result <- reformat_epirange(epirange(20200201, 20201031), "week") + expect_identical(result, epirange(202005, 202044)) + + result <- reformat_epirange(epirange("20200201", "20201031"), "week") + expect_identical(result, epirange(202005, 202044)) + + # Day to day + result <- reformat_epirange(epirange(20200201, 20201031), "day") + expect_identical(result, epirange(20200201, 20201031)) + + result <- reformat_epirange(epirange("20200201", "20201031"), "day") + expect_identical(result, epirange("20200201", "20201031")) }) diff --git a/tests/testthat/test-request.R b/tests/testthat/test-request.R index da09f858..6a3d6536 100644 --- a/tests/testthat/test-request.R +++ b/tests/testthat/test-request.R @@ -1,4 +1,4 @@ test_that("requesting works", { - res <- do_request("https://httpbin.org/status/414", list()) + res <- do_request("https://httpbin.org/status/414", list(), timeout_seconds = 10 * 60) expect_equal(res$status_code, 414) }) diff --git a/tests/testthat/test-utils.R b/tests/testthat/test-utils.R index ad0e6c8f..1ed8fbe6 100644 --- a/tests/testthat/test-utils.R +++ b/tests/testthat/test-utils.R @@ -20,3 +20,98 @@ test_that("format_list", { expect_identical(format_list(list("5", "6")), "5,6") expect_identical(format_list(list("*", "*")), "*,*") }) + +test_that("check_is_cachable can handle both str and date inputs of various lengths", { + epidata_call <- list( + params = list(as_of = NULL, issues = NULL) + ) + fetch_args <- fetch_args_list() + + expect_no_error(check_is_cachable(epidata_call, fetch_args)) + + # as_of string + epidata_call$params$as_of <- "2022-01-01" + epidata_call$params$issues <- NULL + expect_no_error(check_is_cachable(epidata_call, fetch_args)) + + # as_of date + epidata_call$params$as_of <- as.Date("2022-01-01") + epidata_call$params$issues <- NULL + expect_no_error(check_is_cachable(epidata_call, fetch_args)) + + # issues single string + epidata_call$params$as_of <- NULL + epidata_call$params$issues <- "2022-01-01" + expect_no_error(check_is_cachable(epidata_call, fetch_args)) + + # issues string vector + epidata_call$params$as_of <- NULL + epidata_call$params$issues <- c("2022-01-01", "2022-02-01") + expect_no_error(check_is_cachable(epidata_call, fetch_args)) + + # issues single date + epidata_call$params$as_of <- NULL + epidata_call$params$issues <- as.Date("2022-01-01") + expect_no_error(check_is_cachable(epidata_call, fetch_args)) + + # issues date vector + epidata_call$params$as_of <- NULL + epidata_call$params$issues <- c(as.Date("2022-01-01"), as.Date("2022-02-01")) + expect_no_error(check_is_cachable(epidata_call, fetch_args)) + + # issues epirange + epidata_call$params$as_of <- NULL + epidata_call$params$issues <- epirange(as.Date("2022-01-01"), as.Date("2022-02-01")) + expect_no_error(check_is_cachable(epidata_call, fetch_args)) +}) + +test_that("check_is_recent can handle both str and date inputs of various lengths", { + # NULL + as_of <- NULL + expect_no_error(result <- check_is_recent(as_of, 10)) + expect_identical(result, FALSE) + + # as_of single string + as_of <- "2022-01-01" + expect_no_error(result <- check_is_recent(as_of, 10)) + expect_identical(result, FALSE) + + # as_of string vector + as_of <- c("2022-01-01", "3000-01-02", "3000-01-03") + expect_no_error(result <- check_is_recent(as_of, 10)) + expect_identical(result, TRUE) + + # as_of single date + as_of <- as.Date("2022-01-01") + expect_no_error(result <- check_is_recent(as_of, 10)) + expect_identical(result, FALSE) + + # as_of date vector + as_of <- as.Date(c("2022-01-01", "3000-01-02", "3000-01-03")) + expect_no_error(result <- check_is_recent(as_of, 10)) + expect_identical(result, TRUE) +}) + +test_that("get_wildcard_equivalent_dates works in basic cases", { + # Week date + result <- get_wildcard_equivalent_dates(epirange(202002, 202013), "week") + expect_identical(result, epirange(202002, 202013)) + + result <- get_wildcard_equivalent_dates(epirange("202002", "202013"), "week") + expect_identical(result, epirange("202002", "202013")) + + # Week wildcard + result <- get_wildcard_equivalent_dates("*", "week") + expect_identical(result, epirange(100001, 300001)) + + # Day date + result <- get_wildcard_equivalent_dates(epirange(20200201, 20201031), "day") + expect_identical(result, epirange(20200201, 20201031)) + + result <- get_wildcard_equivalent_dates(epirange("20200201", "20201031"), "day") + expect_identical(result, epirange("20200201", "20201031")) + + # Day wildcard + result <- get_wildcard_equivalent_dates("*", "day") + expect_identical(result, epirange(10000101, 30000101)) +}) diff --git a/vignettes/epidatr.Rmd b/vignettes/epidatr.Rmd index a2913b38..d96a2fdf 100644 --- a/vignettes/epidatr.Rmd +++ b/vignettes/epidatr.Rmd @@ -1,8 +1,10 @@ --- -title: "Delphi Epidata R API Client" -output: rmarkdown::html_vignette +title: "Get started with epidatr" +output: + rmarkdown::html_vignette: + code_folding: show vignette: > - %\VignetteIndexEntry{Delphi Epidata R API Client} + %\VignetteIndexEntry{Get started with epidatr} %\VignetteEngine{knitr::rmarkdown} %\VignetteDepends{ggplot2} \usepackage[utf8]{inputenc} @@ -11,385 +13,270 @@ vignette: > ```{r, echo = FALSE, message = FALSE} knitr::opts_chunk$set(collapse = TRUE, comment = "#>") options(tibble.print_min = 4L, tibble.print_max = 4L, max.print = 4L) -library(epidatr) -library(dplyr) ``` The epidatr package provides access to all the endpoints of the [Delphi Epidata API](https://cmu-delphi.github.io/delphi-epidata/), and can be used to make -requests for specific signals on specific dates and in selected geographic +requests for specific signals on specific dates and in select geographic regions. -We recommend you register for an API key. While most endpoints are available -without one, there are [limits on API usage for anonymous -users](https://cmu-delphi.github.io/delphi-epidata/api/api_keys.html), including -a rate limit. If you regularly request large amounts of data, please consider -[registering for an API -key](https://api.delphi.cmu.edu/epidata/admin/registration_form). You can then -specify this key by either -- setting the environment variable `DELPHI_EPIDATA_KEY`, such as by editing your - `.Renviron` file -- setting the option `delphi.epidata.key` using `options()` +## Setup -## Basic Usage +### Installation -Fetching some data from the Delphi Epidata API is simple. Suppose we are -interested in the [`covidcast` -endpoint](https://cmu-delphi.github.io/delphi-epidata/api/covidcast.html), which -provides access to a range of data on COVID-19. Reviewing the endpoint -documentation, we see that we need to specify a data source name, a signal name, -a geographic level, a time resolution, and the location and times of interest. +You can install the stable version of this package from CRAN: -In this case, the `pub_covidcast()` function lets us specify these parameters for -the endpoint and returns a tibble with the results: - -```{r} -epidata <- pub_covidcast( - "fb-survey", "smoothed_cli", "state", "day", "pa", - epirange(20210105, 20210410) -) -epidata +```R +install.packages("epidatr") +pak::pkg_install("epidatr") +renv::install("epidatr") ``` -We can then easily plot the data using ggplot2: +Or if you want the development version, install from GitHub: -```{r, out.height="65%"} -library(ggplot2) -ggplot(epidata, aes(x = time_value, y = value)) + - geom_line() + - labs( - title = "Smoothed CLI from Facebook Survey", - subtitle = "PA, 2021", - x = "Date", - y = "CLI" - ) +```R +# Install the dev version using `pak` or `remotes` +pak::pkg_install("cmu-delphi/epidatr@dev") +remotes::install_github("cmu-delphi/epidatr", ref = "dev") +renv::install("cmu-delphi/epidatr@dev") ``` -The [Delphi Epidata API documentation](https://cmu-delphi.github.io/delphi-epidata/) has more information on the available endpoints and arguments. You can also use the `avail_endpoints()` function to get a table of endpoint functions: +### API Keys -```{r} -avail_endpoints() -``` +The Delphi API requires a (free) API key for full functionality. While most +endpoints are available without one, there are +[limits on API usage for anonymous users](https://cmu-delphi.github.io/delphi-epidata/api/api_keys.html), +including a rate limit. -Example queries with all the endpoint functions available in this package are given [below](#example-queries). +To generate your key, +[register for a pseudo-anonymous account](https://api.delphi.cmu.edu/epidata/admin/registration_form). +See the `save_api_key()` function documentation for details on how to set up +`epidatr` to use your API key. -## Advanced Usage (Experimental) +_Note_ that private endpoints (i.e. those prefixed with `pvt_`) require a +separate key that needs to be passed as an argument. These endpoints require +specific data use agreements to access. -The [COVIDcast -endpoint](https://cmu-delphi.github.io/delphi-epidata/api/covidcast.html) of the -Epidata API contains many separate data sources and signals. It can be difficult -to find the name of the signal you're looking for, so you can use -`covidcast_epidata()` to get help with finding sources and functions without -leaving R. -The `covidcast_epidata()` function fetches a list of all signals, and returns an -object containing fields for every signal: +## Basic Usage -```{r} -epidata <- covidcast_epidata() -epidata$signals -``` +Fetching data from the Delphi Epidata API is simple. Suppose we are +interested in the +[`covidcast` endpoint](https://cmu-delphi.github.io/delphi-epidata/api/covidcast.html), +which provides access to a +[wide range of data](https://cmu-delphi.github.io/delphi-epidata/api/covidcast_signals.html) +on COVID-19. Reviewing the endpoint documentation, we see that we +[need to specify](https://cmu-delphi.github.io/delphi-epidata/api/covidcast.html#constructing-api-queries) +a data source name, a signal name, a geographic level, a time resolution, and +the location and times of interest. -If you use an editor that supports tab completion, such as RStudio, type -`epidata$signals$` and wait for the tab completion popup. You will be able to -type the name of signals and have the autocomplete feature select them from the -list for you. Note that some signal names have dashes in them, so to access them -we rely on the backtick operator: +The `pub_covidcast()` function lets us access the `covidcast` endpoint: ```{r} -epidata$signals$`fb-survey:smoothed_cli` -``` - -These objects can be used directly to fetch data, without requiring us to use -the `pub_covidcast()` function. Simply use the `$call` attribute of the object: +library(epidatr) +library(dplyr) -```{r} -epidata$signals$`fb-survey:smoothed_cli`$call("state", "pa", epirange(20210405, 20210410)) +# Obtain the most up-to-date version of the smoothed covid-like illness (CLI) +# signal from the COVID-19 Trends and Impact survey for the US +epidata <- pub_covidcast( + source = "fb-survey", + signals = "smoothed_cli", + geo_type = "nation", + time_type = "day", + geo_values = "us", + time_values = epirange(20210105, 20210410) +) +knitr::kable(head(epidata)) ``` -## Advanced Usage (Debugging) +`pub_covidcast()` returns a `tibble`. (Here we’re using `knitr::kable()` to make +it more readable.) Each row represents one observation in Pennsylvania on one +day. The state abbreviation is given in the `geo_value` column, the date in +the `time_value` column. Here `value` is the requested signal -- in this +case, the smoothed estimate of the percentage of people with COVID-like +illness, based on the symptom surveys, and `stderr` is its standard error. -We can obtain the [`epidata_call`] object underlying a request by setting the -`dry_run` argument to `TRUE` in `fetch_args_list()`: +The Epidata API makes signals available at different geographic levels, +depending on the endpoint. To request signals for all states instead of the +entire US, we use the `geo_type` argument paired with `*` for the +`geo_values` argument. (Only some endpoints allow for the use of `*` to +access data at all locations. Check the help for a given endpoint to see if +it supports `*`.) -```{r} +```{r, eval = FALSE} +# Obtain the most up-to-date version of the smoothed covid-like illness (CLI) +# signal from the COVID-19 Trends and Impact survey for all states pub_covidcast( - "fb-survey", "smoothed_cli", "state", "day", "pa", - epirange(20210405, 20210410), - fetch_args = fetch_args_list(dry_run = TRUE) + source = "fb-survey", + signals = "smoothed_cli", + geo_type = "state", + time_type = "day", + geo_values = "*", + time_values = epirange(20210105, 20210410) ) ``` -## Example Queries - -(Some endpoints allow for the use of `*` to access data at all locations. Check the help for a given endpoint to see if it supports `*`.) - -### COVIDcast Main Endpoint - -API docs: +We can fetch a subset of states by listing out the desired locations: -County geo_values are [FIPS codes](https://en.wikipedia.org/wiki/List_of_United_States_FIPS_codes_by_county) and are discussed in the API docs [here](https://cmu-delphi.github.io/delphi-epidata/api/covidcast_geography.html). The example below is for Orange County, California. - -```{r} +```{r, eval = FALSE} +# Obtain the most up-to-date version of the smoothed covid-like illness (CLI) +# signal from the COVID-19 Trends and Impact survey for Pennsylvania pub_covidcast( source = "fb-survey", - signals = "smoothed_accept_covid_vaccine", - geo_type = "county", + signals = "smoothed_cli", + geo_type = "state", time_type = "day", - time_values = epirange(20201221, 20201225), - geo_values = "06059" + geo_values = c("pa", "ca", "fl"), + time_values = epirange(20210105, 20210410) ) ``` -The `covidcast` endpoint supports `*` in its time and geo fields: +We can also request data for a single location at a time, via the `geo_values` argument. ```{r} -pub_covidcast( +# Obtain the most up-to-date version of the smoothed covid-like illness (CLI) +# signal from the COVID-19 Trends and Impact survey for Pennsylvania +epidata <- pub_covidcast( source = "fb-survey", - signals = "smoothed_accept_covid_vaccine", - geo_type = "county", + signals = "smoothed_cli", + geo_type = "state", time_type = "day", - time_values = epirange(20201221, 20201225), - geo_values = "*" + geo_values = "pa", + time_values = epirange(20210105, 20210410) ) +knitr::kable(head(epidata)) ``` -### Other Covid Endpoints +## Getting versioned data -#### COVID-19 Hospitalization: Facility Lookup - -API docs: +The Epidata API stores a historical record of all data, including corrections +and updates, which is particularly useful for accurately backtesting +forecasting models. To fetch versioned data, we can use the `as_of` +argument. ```{r, eval = FALSE} -pub_covid_hosp_facility_lookup(city = "southlake") -pub_covid_hosp_facility_lookup(state = "WY") -# A non-example (there is no city called New York in Wyoming) -pub_covid_hosp_facility_lookup(state = "WY", city = "New York") -``` - -#### COVID-19 Hospitalization by Facility - -API docs: - -```{r, eval = FALSE} -pub_covid_hosp_facility( - hospital_pks = "100075", - collection_weeks = epirange(20200101, 20200501) +# Obtain the smoothed covid-like illness (CLI) signal from the COVID-19 +# Trends and Impact survey for Pennsylvania as it was on 2021-06-01 +pub_covidcast( + source = "fb-survey", + signals = "smoothed_cli", + geo_type = "state", + time_type = "day", + geo_values = "pa", + time_values = epirange(20210105, 20210410), + as_of = "2021-06-01" ) ``` -#### COVID-19 Hospitalization by State - -API docs: - -```{r, eval = FALSE} -pub_covid_hosp_state_timeseries(states = "MA", dates = "20200510") -``` - -### Flu Endpoints +See `vignette("versioned-data")` for details and more ways to specify versioned data. -#### Delphi's ILINet forecasts - -API docs: - -```{r, eval = FALSE} -del <- pub_delphi(system = "ec", epiweek = 201501) -names(del[[1L]]$forecast) -``` - -#### FluSurv hospitalization data - -API docs: - -```{r, eval = FALSE} -pub_flusurv(locations = "ca", epiweeks = 202001) -``` - -#### Fluview data - -API docs: - -```{r, eval = FALSE} -pub_fluview(regions = "nat", epiweeks = epirange(201201, 202001)) -``` - -#### Fluview virological data from clinical labs - -API docs: - -```{r, eval = FALSE} -pub_fluview_clinical(regions = "nat", epiweeks = epirange(201601, 201701)) -``` -#### Fluview metadata +## Plotting -API docs: +Because the output data is in a standard `tibble` format, we can easily plot +it using `ggplot2`: -```{r, eval = FALSE} -pub_fluview_meta() -``` - -#### Google Flu Trends data - -API docs: - -```{r, eval = FALSE} -pub_gft(locations = "hhs1", epiweeks = epirange(201201, 202001)) -``` - -#### ECDC ILI - -API docs: - -```{r, eval = FALSE} -pub_ecdc_ili(regions = "Armenia", epiweeks = 201840) +```{r, out.height="65%"} +library(ggplot2) +ggplot(epidata, aes(x = time_value, y = value)) + + geom_line() + + labs( + title = "Smoothed CLI from Facebook Survey", + subtitle = "PA, 2021", + x = "Date", + y = "CLI" + ) ``` -#### KCDC ILI - -API docs: +`ggplot2` can also be used to [create choropleths](https://r-graphics.org/recipe-miscgraph-choropleth). -```{r, eval = FALSE} -pub_kcdc_ili(regions = "ROK", epiweeks = 200436) -``` -#### NIDSS Flu +```{r, class.source = "fold-hide", out.height="65%"} +library(maps) -API docs: +# Obtain the most up-to-date version of the smoothed covid-like illness (CLI) +# signal from the COVID-19 Trends and Impact survey for all states on a single day +cli_states <- pub_covidcast( + source = "fb-survey", + signals = "smoothed_cli", + geo_type = "state", + time_type = "day", + geo_values = "*", + time_values = 20210410 +) -```{r, eval = FALSE} -pub_nidss_flu(regions = "taipei", epiweeks = epirange(200901, 201301)) -``` +# Get a mapping of states to longitude/latitude coordinates +states_map <- map_data("state") -#### ILI Nearby Nowcast +# Convert state abbreviations into state names +cli_states <- mutate( + cli_states, + state = ifelse( + geo_value == "dc", + "district of columbia", + state.name[match(geo_value, tolower(state.abb))] %>% tolower() + ) +) -API docs: +# Add coordinates for each state +cli_states <- left_join(states_map, cli_states, by = c("region" = "state")) -```{r, eval = FALSE} -pub_nowcast(locations = "ca", epiweeks = epirange(202201, 202319)) +# Plot +ggplot(cli_states, aes(x = long, y = lat, group = group, fill = value)) + + geom_polygon(colour = "black", linewidth = 0.2) + + coord_map("polyconic") + + labs( + title = "Smoothed CLI from Facebook Survey", + subtitle = "All states, 2021-04-10", + x = "Longitude", + y = "Latitude" + ) ``` -### Dengue Endpoints -#### Delphi's Dengue Nowcast +## Finding locations of interest -API docs: +Most data is only available for the US. Select endpoints report other countries at the national and/or regional levels. Endpoint descriptions explicitly state when they cover non-US locations. -```{r, eval = FALSE} -pub_dengue_nowcast(locations = "pr", epiweeks = epirange(201401, 202301)) -``` +For endpoints that report US data, see the +[geographic coding documentation](https://cmu-delphi.github.io/delphi-epidata/api/covidcast_geography.html) +for available geographic levels. -#### NIDSS dengue -API docs: +### International data -```{r, eval = FALSE} -pub_nidss_dengue(locations = "taipei", epiweeks = epirange(200301, 201301)) -``` +International data is available via -### PAHO Dengue +- `pub_dengue_nowcast` (North and South America) +- `pub_ecdc_ili` (Europe) +- `pub_kcdc_ili` (Korea) +- `pub_nidss_dengue` (Taiwan) +- `pub_nidss_flu` (Taiwan) +- `pub_paho_dengue` (North and South America) +- `pvt_dengue_sensors` (North and South America) -API docs: -```{r, eval=FALSE} -pub_paho_dengue(regions = "ca", epiweeks = epirange(200201, 202319)) -``` +## Finding data sources and signals of interest -### Other Endpoints +Above we used data from [Delphi’s symptom surveys](https://delphi.cmu.edu/covid19/ctis/), +but the Epidata API includes numerous data streams: medical claims data, cases +and deaths, mobility, and many others. This can make it a challenge to find +the data stream that you are most interested in. -#### Wikipedia Access +The Epidata documentation lists all the data sources and signals available +through the API for [COVID-19](https://cmu-delphi.github.io/delphi-epidata/api/covidcast_signals.html) +and for [other diseases](https://cmu-delphi.github.io/delphi-epidata/api/README.html#source-specific-parameters). -API docs: +You can also use the `avail_endpoints()` function to get a table of endpoint functions: ```{r, eval = FALSE} -pub_wiki(language = "en", articles = "influenza", epiweeks = epirange(202001, 202319)) -``` - -### Private methods - -These require private access keys to use (separate from the Delphi Epidata API key). -To actually run these locally, you will need to store these secrets in your `.Reviron` file, or set them as environmental variables. - -#### CDC - -API docs: - -```{r, eval=FALSE} -pvt_cdc(auth = Sys.getenv("SECRET_API_AUTH_CDC"), epiweeks = epirange(202003, 202304), locations = "ma") -``` - -#### Dengue Digital Surveillance Sensors - -API docs: - -```{r, eval=FALSE} -pvt_dengue_sensors( - auth = Sys.getenv("SECRET_API_AUTH_SENSORS"), - names = "ght", - locations = "ag", - epiweeks = epirange(201404, 202004) -) -``` - -#### Google Health Trends - -API docs: - -```{r, eval=FALSE} -pvt_ght( - auth = Sys.getenv("SECRET_API_AUTH_GHT"), - epiweeks = epirange(199301, 202304), - locations = "ma", - query = "how to get over the flu" -) -``` - -#### NoroSTAT metadata - -API docs: - -```{r, eval=FALSE} -pvt_meta_norostat(auth = Sys.getenv("SECRET_API_AUTH_NOROSTAT")) -``` - -#### NoroSTAT data - -API docs: - -```{r, eval=FALSE} -pvt_norostat(auth = Sys.getenv("SECRET_API_AUTH_NOROSTAT"), locations = "1", epiweeks = 201233) -``` - -#### Quidel Influenza testing - -API docs: - -```{r, eval=FALSE} -pvt_quidel(auth = Sys.getenv("SECRET_API_AUTH_QUIDEL"), locations = "hhs1", epiweeks = epirange(200301, 202105)) +avail_endpoints() ``` -#### Sensors - -API docs: - -```{r, eval=FALSE} -pvt_sensors( - auth = Sys.getenv("SECRET_API_AUTH_SENSORS"), - names = "sar3", - locations = "nat", - epiweeks = epirange(200301, 202105) -) +```{r, echo = FALSE} +invisible(capture.output(endpts <- avail_endpoints())) +knitr::kable(endpts) ``` -#### Twitter - -API docs: - -```{r, eval=FALSE} -pvt_twitter( - auth = Sys.getenv("SECRET_API_AUTH_TWITTER"), - locations = "nat", - epiweeks = epirange(200301, 202105) -) -``` +See `vignette("signal-discovery")` for more information. diff --git a/vignettes/signal-discovery.Rmd b/vignettes/signal-discovery.Rmd new file mode 100644 index 00000000..70a081ae --- /dev/null +++ b/vignettes/signal-discovery.Rmd @@ -0,0 +1,386 @@ +--- +title: "Finding data sources and signals of interest" +output: rmarkdown::html_vignette +vignette: > + %\VignetteIndexEntry{Finding data sources and signals of interest} + %\VignetteEngine{knitr::rmarkdown} + \usepackage[utf8]{inputenc} +--- + +```{r, echo = FALSE, message = FALSE} +knitr::opts_chunk$set(collapse = TRUE, comment = "#>") +options(tibble.print_min = 4L, tibble.print_max = 4L, max.print = 4L) +library(epidatr) +library(dplyr) +``` + +The Epidata API includes numerous data streams -- medical claims data, cases and deaths, mobility, and many others -- covering different geographic regions. This can make it a challenge to find the data stream that you are most interested in. + +Example queries with all the endpoint functions available in this package are +given [below](#example-queries). + + +## Using the documentation + +The Epidata documentation lists all the data sources and signals available +through the API for +[COVID-19](https://cmu-delphi.github.io/delphi-epidata/api/covidcast_signals.html) and +for [other diseases](https://cmu-delphi.github.io/delphi-epidata/api/README.html#source-specific-parameters). +The site also includes a search tool if you have a keyword (e.g. "Taiwan") in mind. + + +## Signal metadata + +Some endpoints have partner metadata available that provides information about +the signals that are available, for example, what time ranges they are +available for, and when they have been updated. + +```{r, echo = FALSE} +suppressMessages(invisible(capture.output(endpts <- avail_endpoints()))) +filter(endpts, endsWith(Endpoint, "_meta()")) %>% knitr::kable() +``` + +## Interactive tooling + +We provide a couple `epidatr` functions to help find data sources and signals. + +The `avail_endpoints()` function lists endpoints, each of which, except for +COVIDcast, corresponds to a single data source. `avail_endpoints()` outputs a +`tibble` of endpoints and brief descriptions, which explicitly state when they +cover non-US locations: + +```{r, eval = FALSE} +avail_endpoints() +``` + +```{r, echo = FALSE} +suppressMessages(invisible(capture.output(endpts <- avail_endpoints()))) +knitr::kable(endpts) +``` + +The `covidcast_epidata()` function lets you look more in-depth at the data +sources available through the COVIDcast endpoint. The function describes +all available data sources and signals: + +```{r} +covid_sources <- covidcast_epidata() +head(covid_sources$sources, n = 2) +``` + +Each source is included as an entry in the `covid_sources$sources` list, associated +with a `tibble` describing included signals. + +If you use an editor that supports tab completion, such as RStudio, type +`covid_sources$source$` and wait for the tab completion popup. You will be able to +browse the list of data sources. + +```{r} +covid_sources$signals +``` + +If you use an editor that supports tab completion, type +`covid_sources$signals$` and wait for the tab completion popup. You will be +able to type the name of signals and have the autocomplete feature select +them from the list for you. In the tab-completion popup, signal names are +prefixed with the name of the data source for filtering convenience. + +_Note_ that some signal names have dashes in them, so to access them +we rely on the backtick operator: + +```{r} +covid_sources$signals$`fb-survey:smoothed_cli` +``` + +These signal objects can be used directly to fetch data, without requiring us to use +the `pub_covidcast()` function. Simply use the `$call` attribute of the object: + +```{r} +epidata <- covid_sources$signals$`fb-survey:smoothed_cli`$call( + "state", "pa", epirange(20210405, 20210410) +) +knitr::kable(epidata) +``` + + +## Example Queries + +### COVIDcast Main Endpoint + +API docs: + +County geo_values are [FIPS codes](https://en.wikipedia.org/wiki/List_of_United_States_FIPS_codes_by_county) and are discussed in the API docs [here](https://cmu-delphi.github.io/delphi-epidata/api/covidcast_geography.html). The example below is for Orange County, California. + +```{r} +pub_covidcast( + source = "fb-survey", + signals = "smoothed_accept_covid_vaccine", + geo_type = "county", + time_type = "day", + time_values = epirange(20201221, 20201225), + geo_values = "06059" +) +``` + +The `covidcast` endpoint supports `*` in its time and geo fields: + +```{r} +pub_covidcast( + source = "fb-survey", + signals = "smoothed_accept_covid_vaccine", + geo_type = "county", + time_type = "day", + time_values = epirange(20201221, 20201225), + geo_values = "*" +) +``` + +### Other Covid Endpoints + +#### COVID-19 Hospitalization: Facility Lookup + +API docs: + +```{r, eval = FALSE} +pub_covid_hosp_facility_lookup(city = "southlake") +pub_covid_hosp_facility_lookup(state = "WY") +# A non-example (there is no city called New York in Wyoming) +pub_covid_hosp_facility_lookup(state = "WY", city = "New York") +``` + +#### COVID-19 Hospitalization by Facility + +API docs: + +```{r, eval = FALSE} +pub_covid_hosp_facility( + hospital_pks = "100075", + collection_weeks = epirange(20200101, 20200501) +) +``` + +#### COVID-19 Hospitalization by State + +API docs: + +```{r, eval = FALSE} +pub_covid_hosp_state_timeseries(states = "MA", dates = "20200510") +``` + +### Flu Endpoints + +#### Delphi's ILINet forecasts + +API docs: + +```{r, eval = FALSE} +del <- pub_delphi(system = "ec", epiweek = 201501) +names(del[[1L]]$forecast) +``` + +#### FluSurv hospitalization data + +API docs: + +```{r, eval = FALSE} +pub_flusurv(locations = "ca", epiweeks = 202001) +``` + +#### Fluview data + +API docs: + +```{r, eval = FALSE} +pub_fluview(regions = "nat", epiweeks = epirange(201201, 202001)) +``` + +#### Fluview virological data from clinical labs + +API docs: + +```{r, eval = FALSE} +pub_fluview_clinical(regions = "nat", epiweeks = epirange(201601, 201701)) +``` + +#### Fluview metadata + +API docs: + +```{r, eval = FALSE} +pub_fluview_meta() +``` + +#### Google Flu Trends data + +API docs: + +```{r, eval = FALSE} +pub_gft(locations = "hhs1", epiweeks = epirange(201201, 202001)) +``` + +#### ECDC ILI + +API docs: + +```{r, eval = FALSE} +pub_ecdc_ili(regions = "Armenia", epiweeks = 201840) +``` + +#### KCDC ILI + +API docs: + +```{r, eval = FALSE} +pub_kcdc_ili(regions = "ROK", epiweeks = 200436) +``` + +#### NIDSS Flu + +API docs: + +```{r, eval = FALSE} +pub_nidss_flu(regions = "taipei", epiweeks = epirange(200901, 201301)) +``` + +#### ILI Nearby Nowcast + +API docs: + +```{r, eval = FALSE} +pub_nowcast(locations = "ca", epiweeks = epirange(202201, 202319)) +``` + +### Dengue Endpoints + +#### Delphi's Dengue Nowcast + +API docs: + +```{r, eval = FALSE} +pub_dengue_nowcast(locations = "pr", epiweeks = epirange(201401, 202301)) +``` + +#### NIDSS dengue + +API docs: + +```{r, eval = FALSE} +pub_nidss_dengue(locations = "taipei", epiweeks = epirange(200301, 201301)) +``` + +### PAHO Dengue + +API docs: + +```{r, eval=FALSE} +pub_paho_dengue(regions = "ca", epiweeks = epirange(200201, 202319)) +``` + +### Other Endpoints + +#### Wikipedia Access + +API docs: + +```{r, eval = FALSE} +pub_wiki( + language = "en", + articles = "influenza", + time_type = "week", + time_values = epirange(202001, 202319) +) +``` + +### Private methods + +These require private access keys to use (separate from the Delphi Epidata API key). +To actually run these locally, you will need to store these secrets in your `.Reviron` file, or set them as environmental variables. + +
+ +Usage of private endpoints + +#### CDC + +API docs: + +```{r, eval=FALSE} +pvt_cdc(auth = Sys.getenv("SECRET_API_AUTH_CDC"), epiweeks = epirange(202003, 202304), locations = "ma") +``` + +#### Dengue Digital Surveillance Sensors + +API docs: + +```{r, eval=FALSE} +pvt_dengue_sensors( + auth = Sys.getenv("SECRET_API_AUTH_SENSORS"), + names = "ght", + locations = "ag", + epiweeks = epirange(201404, 202004) +) +``` + +#### Google Health Trends + +API docs: + +```{r, eval=FALSE} +pvt_ght( + auth = Sys.getenv("SECRET_API_AUTH_GHT"), + epiweeks = epirange(199301, 202304), + locations = "ma", + query = "how to get over the flu" +) +``` + +#### NoroSTAT metadata + +API docs: + +```{r, eval=FALSE} +pvt_meta_norostat(auth = Sys.getenv("SECRET_API_AUTH_NOROSTAT")) +``` + +#### NoroSTAT data + +API docs: + +```{r, eval=FALSE} +pvt_norostat(auth = Sys.getenv("SECRET_API_AUTH_NOROSTAT"), locations = "1", epiweeks = 201233) +``` + +#### Quidel Influenza testing + +API docs: + +```{r, eval=FALSE} +pvt_quidel(auth = Sys.getenv("SECRET_API_AUTH_QUIDEL"), locations = "hhs1", epiweeks = epirange(200301, 202105)) +``` + +#### Sensors + +API docs: + +```{r, eval=FALSE} +pvt_sensors( + auth = Sys.getenv("SECRET_API_AUTH_SENSORS"), + names = "sar3", + locations = "nat", + epiweeks = epirange(200301, 202105) +) +``` + +#### Twitter + +API docs: + +```{r, eval=FALSE} +pvt_twitter( + auth = Sys.getenv("SECRET_API_AUTH_TWITTER"), + locations = "nat", + time_type = "week", + time_values = epirange(200301, 202105) +) +``` + +
diff --git a/vignettes/versioned-data.Rmd b/vignettes/versioned-data.Rmd new file mode 100644 index 00000000..27271c6c --- /dev/null +++ b/vignettes/versioned-data.Rmd @@ -0,0 +1,163 @@ +--- +title: "Understanding and accessing versioned data" +output: rmarkdown::html_vignette +vignette: > + %\VignetteIndexEntry{Understanding and accessing versioned data} + %\VignetteEngine{knitr::rmarkdown} + \usepackage[utf8]{inputenc} +--- + +```{r, echo = FALSE, message = FALSE} +knitr::opts_chunk$set(collapse = TRUE, comment = "#>") +options(tibble.print_min = 4L, tibble.print_max = 4L, max.print = 4L) +library(epidatr) +library(dplyr) +``` + + +The Epidata API records not just each signal's estimate for a given location +on a given day, but also *when* that estimate was made, and all updates to that +estimate. + +For example, let's look at the [doctor visits +signal](https://cmu-delphi.github.io/delphi-epidata/api/covidcast-signals/doctor-visits.html) +from the [`covidcast` endpoint](https://cmu-delphi.github.io/delphi-epidata/api/covidcast.html), +which estimates the percentage of outpatient doctor visits that are +COVID-related. Consider a result row with `time_value` 2020-05-01 for +`geo_values = "pa"`. This is an estimate for Pennsylvania on +May 1, 2020. That estimate was *issued* on May 5, 2020, the delay being due to +the aggregation of data by our source and the time taken by the Epidata API to +ingest the data provided. Later, the estimate for May 1st could be updated, +perhaps because additional visit data from May 1st arrived at our source and was +reported to us. This constitutes a new *issue* of the data. + + +### Data known "as of" a specific date + +By default, endpoint functions fetch the most recent issue available. This +is the best option for users who simply want to graph the latest data or +construct dashboards. But if we are interested in knowing *when* data was +reported, we can request specific data versions using the `as_of`, `issues`, or +`lag` arguments. + +_Note_ that these are mutually exclusive; only one can be specified +at a time. Also, not all endpoints support all three parameters, so please +check the documentation for that specific endpoint. + +First, we can request the data that was available *as of* a specific date, using +the `as_of` argument: + + +```{r} +epidata <- pub_covidcast( + source = "doctor-visits", + signals = "smoothed_adj_cli", + time_type = "day", + time_values = epirange("2020-05-01", "2020-05-01"), + geo_type = "state", + geo_values = "pa", + as_of = "2020-05-07" +) +knitr::kable(epidata) +``` + +This shows that an estimate of about 2.3% was issued on May 7. If we don't +specify `as_of`, we get the most recent estimate available: + + +```{r} +epidata <- pub_covidcast( + source = "doctor-visits", + signals = "smoothed_adj_cli", + time_type = "day", + time_values = epirange("2020-05-01", "2020-05-01"), + geo_type = "state", + geo_values = "pa" +) +knitr::kable(epidata) +``` + +Note the substantial change in the estimate, from less than 3% to almost 6%, +reflecting new data that became available after May 7 about visits *occurring on* +May 1. This illustrates the importance of issue date tracking, particularly +for forecasting tasks. To backtest a forecasting model on past data, it is +important to use the data that would have been available *at the time* the model +was or would have been fit, not data that arrived much later. + + +### Multiple issues of observations + +By using the `issues` argument, we can request all issues in a certain time +period: + +```{r} +epidata <- pub_covidcast( + source = "doctor-visits", + signals = "smoothed_adj_cli", + time_type = "day", + time_values = epirange("2020-05-01", "2020-05-01"), + geo_type = "state", + geo_values = "pa", + issues = epirange("2020-05-01", "2020-05-15") +) +knitr::kable(epidata) +``` + +This estimate was clearly updated many times as new data for May 1st arrived. + +Note that these results include only data issued or updated between +(inclusive) 2020-05-01 and 2020-05-15. If a value was first reported on +2020-04-15, and never updated, a query for issues between 2020-05-01 and +2020-05-15 will not include that value among its results. + +The `issues` parameter also accepts a list of dates. + +```{r, eval = FALSE} +pub_covidcast( + source = "doctor-visits", + signals = "smoothed_adj_cli", + time_type = "day", + time_values = epirange("2020-05-01", "2020-05-01"), + geo_type = "state", + geo_values = "pa", + issues = c("2020-05-07", "2020-05-09", "2020-05-15") +) +``` + + +### Observations issued with a specific lag + +Finally, we can use the `lag` argument to request only data reported with a +certain lag. For example, requesting a lag of 7 days fetches only data issued +exactly 7 days after the corresponding `time_value`: + +```{r} +epidata <- pub_covidcast( + source = "doctor-visits", + signals = "smoothed_adj_cli", + time_type = "day", + time_values = epirange("2020-05-01", "2020-05-07"), + geo_type = "state", + geo_values = "pa", + lag = 7 +) +knitr::kable(epidata) +``` + +Note that though this query requested all values between 2020-05-01 and +2020-05-07, May 3rd and May 4th were *not* included in the results set. This is +because the query will only include a result for May 3rd if a value were issued +on May 10th (a 7-day lag), but in fact the value was not updated on that day: + +```{r} +epidata <- pub_covidcast( + source = "doctor-visits", + signals = "smoothed_adj_cli", + time_type = "day", + time_values = epirange("2020-05-03", "2020-05-03"), + geo_type = "state", + geo_values = "pa", + issues = epirange("2020-05-09", "2020-05-15") +) +knitr::kable(epidata) +```