new function pase_calc() with sample data and a version bump

2025-04-18 04:13:54 +02:00 · 2023-06-30 11:50:50 +02:00 · 2023-06-30 11:50:50 +02:00 · 1b3f5b6eeb
commit 1b3f5b6eeb
parent ec7bb2c349
10 changed files with 308 additions and 1 deletions
--- a/2
+++ b/2
@ -1,6 +1,6 @@
 Package: stRoke
 Title: Clinical Stroke Research
-Version: 23.6.1
+Version: 23.6.2
 Authors@R: 
    person("Andreas Gammelgaard", "Damsbo", , "agdamsbo@clin.au.dk", role = c("aut", "cre"),
           comment = c(ORCID = "0000-0002-7559-1154"))
--- a/1
+++ b/1
@ -13,6 +13,7 @@ export(files_filter)
 export(generic_stroke)
 export(index_plot)
 export(label_select)
 export(pase_calc)
 export(quantile_cut)
 export(source_lines)
 export(win_prob)
--- a/NEWS.md
+++ b/NEWS.md
@ -1,3 +1,13 @@
 # stRoke 23.6.2
 ### Functions:
 * NEW: `pase_calc()` function calculates PASE scores from raw questionnaire data. Gives sub scores as well and returns basic data quality and completeness checks. Acknowledges the difference between the scoring manual and the article by Washburn PA. et al. (1999) on including sitting work in the score calculations.
 ### Data:
 * NEW: `pase` sample questionnaire data. Non-identifiable and for use with the `pase_calc()` function.
 # stRoke 23.6.1
 ### Functions:
--- a/R/pase.R
+++ b/R/pase.R
@ -0,0 +1,32 @@
 #' Data frame with sample data of PASE score questionnaire
 #'
 #' Contains non-identifiable organic trial data.
 #' Sample data labels are in Danish.
 #'
 #' @format A data frame with 200 rows and 21 variables:
 #' \describe{
 #'   \item{sample_pase01}{item 01, factor}
 #'   \item{sample_pase01b}{item 01b, factor}
 #'   \item{sample_pase02}{item 02, factor}
 #'   \item{sample_pase02a}{item 02a, factor}
 #'   \item{sample_pase03}{item 03, factor}
 #'   \item{sample_pase03b}{item 03b, factor}
 #'   \item{sample_pase04}{item 04, factor}
 #'   \item{sample_pase04b}{item 04b, factor}
 #'   \item{sample_pase05}{item 05, factor}
 #'   \item{sample_pase05b}{item 05b, factor}
 #'   \item{sample_pase06}{item 06, factor}
 #'   \item{sample_pase06b}{item 06b, factor}
 #'   \item{sample_pase07}{item 07, factor}
 #'   \item{sample_pase08}{item 08, factor}
 #'   \item{sample_pase09a}{item 09a, factor}
 #'   \item{sample_pase09b}{item 09b, factor}
 #'   \item{sample_pase09c}{item 09c, factor}
 #'   \item{sample_pase09d}{item 09d, factor}
 #'   \item{sample_pase10}{item 10, factor}
 #'   \item{sample_pase10a}{item 10a, numeric}
 #'   \item{sample_pase10b}{item 10b, factor}
 #' }
 #' @usage data(pase)
 "pase"
--- a/R/pase_calc.R
+++ b/R/pase_calc.R
@ -0,0 +1,171 @@
 #' PASE score calculator
 #' 
 #' Calculates PASE score from raw questionnaire data.
 #' @param ds data set
 #' @param adjust_work flag to set whether to include 10b type 1. 
 #' Default is TRUE.
 #'
 #' @return data.frame
 #' @export
 #' @details
 #' Labelling should be as defined by the questionnaire.
 #' 02-06 should start with 0:3, 02a-06b should start with 1:4.
 #' 
 #' ## Regarding work scoring
 #' The score calculation manual available for the PASE questionnaire, all types
 #' of work should be included. According to the article by 
 #' Washburn RA. et al (1999) sitting work is not included in the item 10 score.
 #' This differentiation is added with the option to set `adjust_work` to
 #' exclude item 10b category 1 work (set `TRUE`).
 #' 
 #' ## Regarding output
 #' Output includes sub scores as well as sums, but also to columns assessing data 
 #' quality and completeness. If any field has not been filled, `score_incompletes`
 #' will return `TRUE`. If all measures are missing `score_missings` is `TRUE`.
 #' If `adjust_work==TRUE`, 10b has to be filled, or `score_incompletes` will be
 #' set `TRUE`.
 #' 
 #' @examples
 #' summary(pase_calc(stRoke::pase)[,13])
 #' 
 pase_calc <- function(ds, adjust_work = FALSE) {
  if (ncol(ds) != 21) stop("supplied data set has to contain exactly 21 columns")
  pase <- ds
  ## Classify all as characters
  ## Labelling should be as defined by the questionnaire.
  ## 02-06 should start with 0:3, 02a-06b should start with 1:4.
  pase <- do.call(data.frame, lapply(pase, as.character))
  ## Missings and incompletes
  missings <- apply(apply(ds, 2, is.na), 1, all)
  incompletes <-
    apply(sapply(ds[, c(1, 3, 5, 7, 9, 11, 13:20)], function(x) {
      x == "Not available" | is.na(x)
    }), 1, any)
  names(pase) <- c(
    "pase01",
    "pase01b",
    "pase02",
    "pase02a",
    "pase03",
    "pase03b",
    "pase04",
    "pase04b",
    "pase05",
    "pase05b",
    "pase06",
    "pase06b",
    "pase07",
    "pase08",
    "pase09a",
    "pase09b",
    "pase09c",
    "pase09d",
    "pase10",
    "pase10a",
    "pase10b"
  )
  pase_list <- lapply(unique(substr(names(pase), 5, 6)), function(x) {
    pase[grepl(x, substr(names(pase), 5, 6))]
  })
  names(pase_list) <- unique(substr(names(pase), 5, 6))
  ## PASE 2-6
  pase_weigths <- list(
    "1" = c(
      "1" = 0.11,
      "2" = 0.32,
      "3" = 0.64,
      "4" = 1.07
    ),
    "2" = c(
      "1" = 0.25,
      "2" = 0.75,
      "3" = 1.5,
      "4" = 2.5
    ),
    "3" = c(
      "1" = 0.43,
      "2" = 1.29,
      "3" = 2.57,
      "4" = 4.29
    )
  )
  ## Multiplication factors
  pase_multip_26 <- c(20, 21, 23, 23, 30)
  pase_score_26 <- lapply(seq_along(pase_list[2:6]), function(x) {
    df <- pase_list[2:6][[x]]
    score <- c()
    ## =====================
    ## Checking labelling
    if (!all(range(suppressWarnings(as.numeric(substr(
      df[, 1], 1, 1
    ))), na.rm = TRUE) == c(0, 3))) {
      stop("Labelling of 02-06 should start with a number ranging 1-4")
    }
    ## =====================
    for (i in seq_len(nrow(df))) {
      # Setting categories from numbers
      n1 <- suppressWarnings(as.numeric(substr(df[, 1][i], 1, 1)))
      # Using if statement to calculate row wise
      if (n1 %in% c(1:3)) {
        # Second category
        n2 <- suppressWarnings(as.numeric(substr(df[, 2][i], 1, 1)))
        score[i] <- pase_weigths[[n1]][n2] * pase_multip_26[x] 
      } else if (n1 %in% 0) {
        score[i] <- 0
      } else {
        score[i] <- NA
      }
    }
    score
  })
  names(pase_score_26) <- paste0("score_", names(pase_list[2:6]))
  ## PASE 7-9d
  pase_multip_79 <- c(25, 25, 30, 36, 20, 35)
  pase_score_79 <-
    data.frame(t(t(
      sapply(Reduce(cbind,pase_list[7:9]),function(j){
        grepl("[Jj]a",j)
      }) + 0 # short hand logic to numeric
    ) * pase_multip_79))
  names(pase_score_79) <-
    paste0("score_", sub("pase", "", names(pase_score_79)))
  ## PASE 10
  ## Completely ignores if 10b is not completed
  pase_score_10 <- 21 * suppressWarnings(as.numeric(pase_list[[10]][[2]])) / 7
  if (adjust_work){
    # Only includes work time if 10b is != 1
    pase_score_10[substr(pase_list[[10]][[3]],1,1) == "1"] <- 0
    # Consequently consider "Not available" in 10b as incomplete
    incompletes[ds[,21] == "Not available" & !incompletes & !is.na(incompletes)] <- TRUE
  }
  pase_score <- cbind(pase_score_26, pase_score_79, pase_score_10)
  data.frame(
    pase_score,
    score_sum = rowSums(pase_score, na.rm = TRUE),
    score_missings = missings,
    score_incompletes = incompletes
  )
 }
--- a/data/pase.rda
+++ b/data/pase.rda
--- a/inst/WORDLIST
+++ b/inst/WORDLIST
@ -1,4 +1,5 @@
 Andreas
 CMD
 Changelog
 Codecov
 DDMMYY
@ -7,11 +8,13 @@ DataDictionary
 Gammelgaard
 Github
 Kraglund
 Labelling
 METACRAN
 NA's
 OLR
 ORCID
 OpenAI's
 PASE
 REDCap
 REDCapRITS
 RStudio
@ -21,6 +24,7 @@ StackOverflow
 Sys
 TALOS
 Vectorised
 Washburn
 XXXX
 Zou
 agdamsbo
--- a/man/pase.Rd
+++ b/man/pase.Rd
@ -0,0 +1,40 @@
 % Generated by roxygen2: do not edit by hand
 % Please edit documentation in R/pase.R
 \docType{data}
 \name{pase}
 \alias{pase}
 \title{Data frame with sample data of PASE score questionnaire}
 \format{
 A data frame with 200 rows and 21 variables:
 \describe{
 \item{sample_pase01}{item 01, factor}
 \item{sample_pase01b}{item 01b, factor}
 \item{sample_pase02}{item 02, factor}
 \item{sample_pase02a}{item 02a, factor}
 \item{sample_pase03}{item 03, factor}
 \item{sample_pase03b}{item 03b, factor}
 \item{sample_pase04}{item 04, factor}
 \item{sample_pase04b}{item 04b, factor}
 \item{sample_pase05}{item 05, factor}
 \item{sample_pase05b}{item 05b, factor}
 \item{sample_pase06}{item 06, factor}
 \item{sample_pase06b}{item 06b, factor}
 \item{sample_pase07}{item 07, factor}
 \item{sample_pase08}{item 08, factor}
 \item{sample_pase09a}{item 09a, factor}
 \item{sample_pase09b}{item 09b, factor}
 \item{sample_pase09c}{item 09c, factor}
 \item{sample_pase09d}{item 09d, factor}
 \item{sample_pase10}{item 10, factor}
 \item{sample_pase10a}{item 10a, numeric}
 \item{sample_pase10b}{item 10b, factor}
 }
 }
 \usage{
 data(pase)
 }
 \description{
 Contains non-identifiable organic trial data.
 Sample data labels are in Danish.
 }
 \keyword{datasets}
--- a/man/pase_calc.Rd
+++ b/man/pase_calc.Rd
@ -0,0 +1,45 @@
 % Generated by roxygen2: do not edit by hand
 % Please edit documentation in R/pase_calc.R
 \name{pase_calc}
 \alias{pase_calc}
 \title{PASE score calculator}
 \usage{
 pase_calc(ds, adjust_work = FALSE)
 }
 \arguments{
 \item{ds}{data set}
 \item{adjust_work}{flag to set whether to include 10b type 1.
 Default is TRUE.}
 }
 \value{
 data.frame
 }
 \description{
 Calculates PASE score from raw questionnaire data.
 }
 \details{
 Labelling should be as defined by the questionnaire.
 02-06 should start with 0:3, 02a-06b should start with 1:4.
 \subsection{Regarding work scoring}{
 The score calculation manual available for the PASE questionnaire, all types
 of work should be included. According to the article by
 Washburn RA. et al (1999) sitting work is not included in the item 10 score.
 This differentiation is added with the option to set \code{adjust_work} to
 exclude item 10b category 1 work (set \code{TRUE}).
 }
 \subsection{Regarding output}{
 Output includes sub scores as well as sums, but also to columns assessing data
 quality and completeness. If any field has not been filled, \code{score_incompletes}
 will return \code{TRUE}. If all measures are missing \code{score_missings} is \code{TRUE}.
 If \code{adjust_work==TRUE}, 10b has to be filled, or \code{score_incompletes} will be
 set \code{TRUE}.
 }
 }
 \examples{
 summary(pase_calc(stRoke::pase)[,13])
 }
--- a/tests/testthat/test-pase_calc.R
+++ b/tests/testthat/test-pase_calc.R
@ -0,0 +1,4 @@
 test_that("pase_calc works", {
  expect_equal(median(pase_calc(stRoke::pase)[,13],na.rm=TRUE), 128.625)
  expect_equal(median(pase_calc(stRoke::pase,TRUE)[,13],na.rm=TRUE), 116.2)
 })