Creates get_multi_ona_data (#10)

This solves #10 and produces `get_multi_ona_data` function for users to download multiple ONA data into a single dataframe.
WorldHealthOrganization · Apr 29, 2024 · 35c4401 · 35c4401
1 parent e3231ac
commit 35c4401
Show file tree

Hide file tree

Showing 4 changed files with 86 additions and 1 deletion.
diff --git a/DESCRIPTION b/DESCRIPTION
@@ -30,7 +30,8 @@ Imports:
   jsonlite,
   tidyselect,
   httpcode,
-  tibble
+  tibble,
+  pbmcapply
 Suggests: 
   testthat,
   withr,

diff --git a/NAMESPACE b/NAMESPACE
@@ -1,5 +1,6 @@
 # Generated by roxygen2: do not edit by hand
 
+export(get_multi_ona_data)
 export(get_ona_data)
 export(prep_geonames)
 export(prep_match_datatypes)

diff --git a/R/get_ona.R b/R/get_ona.R
@@ -231,3 +231,57 @@ get_ona_data <- function(
   return(results)
 }
 
+#' Get Data from ONA for Multiple Forms
+#'
+#' This function retrieves data for a specified form from the ONA API using a 
+#' provided API token and constructs a unique key for each dataset. It returns 
+#' the data in a structured format if the request is successful.
+#'
+#' @param base_url The base URL for the ONA API; defaults to 
+#'            'https://api.whonghub.org'.
+#' @param form_ids A vector containing form id number to identify each form.
+#' @param api_token A string specifying the API token for ONA.
+#'
+#' @return A data frame containing the combined data from all specified form 
+#'        IDs, and includes from_id column.
+#' @examples
+#' # api_token <- "your_api_token_here"
+#' # data <- get_multi_ona_data(form_ids = c(623, 432, 643), api_token)
+#' @export
+get_multi_ona_data <- function(
+    base_url = "https://api.whonghub.org", form_ids, api_token) {
+
+  # Check if the form IDs are available for download ---------------------------
+  resp_data <- prep_ona_data_endpoints(
+    base_url = base_url,
+    api_token = api_token
+  )
+
+  if (!all(form_ids %in% unique(resp_data$id))) {
+    missing_ids <- form_ids[!form_ids %in% unique(resp_data$id)]
+    cli::cli_abort(
+      paste0("Form IDs ", 
+             toString(missing_ids), 
+             " not found. Use `prep_ona_data_endpoints()` ",
+             "to check available forms for download.")
+    )
+  }
+
+  # Fetch data in parallel for each form ID ------------------------------------
+  results_list <- pbmcapply::pbmclapply(
+    form_ids,
+    function(form_id) {
+      get_ona_data(form_id = form_id, api_token = api_token)
+    },
+    mc.cores = parallel::detectCores() - 1
+  )
+
+  # Set names for each element in the results list to match form_ids
+  names(results_list) <- as.character(form_ids)
+
+  # Combine all into one df
+  combined_data <- dplyr::bind_rows(results_list, .id = "form_id")
+
+  return(combined_data)
+}
+
diff --git a/man/get_multi_ona_data.Rd b/man/get_multi_ona_data.Rd