stRoke/R/quantile_cut.R

44 lines
1.6 KiB
R
Raw Normal View History

2022-09-22 15:45:40 +02:00
#' Easy function for splitting numeric variable in quantiles
#'
#' Using base/stats functions cut() and quantile().
2022-09-23 09:14:47 +02:00
#'
2022-09-22 15:45:40 +02:00
#' @param x Variable to cut.
#' @param groups Number of groups.
#' @param y alternative vector to draw quantile cuts from. Limits has to be within x. Default is NULL.
#' @param na.rm Remove NA's. Default is TRUE.
#' @param group.names Names of groups to split to. Default is NULL, giving intervals as names.
#' @param ordered.f Set resulting vector as ordered. Default is FALSE.
2022-09-23 12:05:32 +02:00
#' @param detail.list flag to include details or not
2022-09-22 15:45:40 +02:00
#' @param inc.outs Flag to include min(x) and max(x) as boarders in case of y!=NULL.
2022-09-23 09:14:47 +02:00
#'
2022-09-23 12:05:32 +02:00
#' @return vector or list with vector and details (length 2)
2022-09-23 09:14:47 +02:00
#'
2022-09-22 15:45:40 +02:00
#' @keywords quantile
#' @export
#' @examples
#' aa <- as.numeric(sample(1:1000,2000,replace = TRUE))
#' x <- 1:450
#' y <- 6:750
2022-09-23 09:14:47 +02:00
#' summary(quantile_cut(aa,groups=4,detail.list=FALSE)) ## Cuts quartiles
2023-01-11 12:54:08 +01:00
quantile_cut<-function (x, groups, y=NULL, na.rm = TRUE,
group.names = NULL, ordered.f = FALSE, inc.outs=FALSE,
detail.list=FALSE){
2022-09-22 15:45:40 +02:00
if (!is.null(y)){
2023-01-11 12:54:08 +01:00
q<-quantile(y, probs = seq(0, 1, 1/groups), na.rm = na.rm,
names = TRUE, type = 7)
if (inc.outs){ # Setting cut borders to include outliers in x compared to y.
2022-09-22 15:45:40 +02:00
q[1]<-min(x,na.rm = TRUE)
q[length(q)]<-max(x,na.rm = TRUE)
}
}
if (is.null(y)){
2023-01-11 12:54:08 +01:00
q<-quantile(x, probs = seq(0, 1, 1/groups), na.rm = na.rm,
names = TRUE, type = 7)
2022-09-22 15:45:40 +02:00
}
d<-cut(x, q, include.lowest = TRUE, labels = group.names,
ordered_result = ordered.f)
2022-09-23 09:14:47 +02:00
if (detail.list) list(d,q) else d
2022-09-22 15:45:40 +02:00
}