REDCapCAST/R/read_redcap_tables.R

118 lines
3.6 KiB
R
Raw Normal View History

2023-02-28 09:54:03 +01:00
#' Download REDCap data
#'
#' Implementation of REDCap_split with a focused data acquisition approach using
#' REDCapR::redcap_read and only downloading specified fields, forms and/or
#' events using the built-in focused_metadata including some clean-up.
#' Works with classical and longitudinal projects with or without repeating
#' instruments.
#'
#' Supplied `fields`, `forms` and `events` are checked against the project
#' before any data is requested. Invalid names raise an error that lists the
#' offending names.
#'
#' @param uri REDCap database uri
#' @param token API token
#' @param records records to download. Passed on to REDCapR::redcap_read().
#' Default is NULL.
#' @param fields fields to download. Checked against the `field_name` column
#' of the project metadata. Default is NULL.
#' @param events events to download. Checked against the `unique_event_name`
#' column returned by REDCapR::redcap_event_instruments(). Default is NULL.
#' @param forms forms to download. Checked against the `form_name` column of
#' the project metadata. Default is NULL.
#' @param raw_or_label raw or label tags. Passed on to REDCapR::redcap_read().
#' Default is "label".
#' @param split_forms Whether to split "repeating" or "all" forms, default is
#' all.
#' @param generics vector of auto-generated generic variable names to
#' ignore when discarding empty rows
#'
#' @return list of instruments
#' @importFrom REDCapR redcap_metadata_read redcap_read redcap_event_instruments
#' @include utils.r
#' @export
#'
#' @examples
#' # Examples will be provided later
read_redcap_tables <- function(uri,
                               token,
                               records = NULL,
                               fields = NULL,
                               events = NULL,
                               forms = NULL,
                               raw_or_label = "label",
                               split_forms = "all",
                               generics = c(
                                 "record_id",
                                 "redcap_event_name",
                                 "redcap_repeat_instrument",
                                 "redcap_repeat_instance"
                               )) {
  # Local helper: raise an error naming every supplied value that is not found
  # among the valid ones. `what` is the kind of name ("field", "form", "event")
  # and is only used to build the message.
  check_names <- function(supplied, valid, what) {
    invalid <- supplied[!supplied %in% valid]
    if (length(invalid) > 0) {
      stop(
        "Not all supplied ", what, " names are valid. ",
        "The following ", what, " names are invalid: ",
        paste(invalid, collapse = ", "), ".",
        call. = FALSE
      )
    }
    invisible(TRUE)
  }

  # Getting metadata. Downloaded once and reused both for validating the
  # request and for splitting the data further down.
  meta <- REDCapR::redcap_metadata_read(redcap_uri = uri, token = token)

  # Without this check a failed request would surface below as every supplied
  # field/form name being reported as invalid.
  if (isFALSE(meta[["success"]])) {
    stop(
      "Could not download REDCap metadata. ",
      meta[["outcome_message"]],
      call. = FALSE
    )
  }
  m <- meta[["data"]]

  # Validating the request before downloading any data
  if (!is.null(fields)) {
    check_names(fields, unique(m$field_name), "field")
  }

  if (!is.null(forms)) {
    check_names(forms, unique(m$form_name), "form")
  }

  if (!is.null(events)) {
    # The event mapping requires an extra API call, so it is only fetched when
    # events were actually requested.
    arm_event_inst <- REDCapR::redcap_event_instruments(
      redcap_uri = uri,
      token = token
    )
    check_names(
      events,
      unique(arm_event_inst$data$unique_event_name),
      "event"
    )
  }

  # Getting dataset
  d <- REDCapR::redcap_read(
    redcap_uri = uri,
    token = token,
    fields = fields,
    events = events,
    forms = forms,
    records = records,
    raw_or_label = raw_or_label
  )[["data"]]

  # Process repeat instrument naming
  # Removes any extra characters other than a-z, 0-9 and "_", to mimic raw
  # instrument names.
  if ("redcap_repeat_instrument" %in% names(d)) {
    d$redcap_repeat_instrument <- clean_redcap_name(d$redcap_repeat_instrument)
  }

  # Processing metadata to reflect dataset
  if (!is.null(c(fields, forms, events))) {
    m <- focused_metadata(m, names(d))
  }

  # Splitting
  l <- REDCap_split(d,
    m,
    forms = split_forms,
    primary_table_name = ""
  )

  # Sanitizing split list by removing completely empty rows apart from colnames
  # in "generics"
  sanitize_split(l, generics)
}