Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 1 | #' Helper functions to generate inline sparklines |
| 2 | #' |
| 3 | #' @description These functions helps you quickly generate sets of sparkline |
Bill Evans | 5a383e5 | 2020-08-30 20:09:52 -0700 | [diff] [blame] | 4 | #' style plots using base R plotting system. Currently, we support histogram, |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 5 | #' boxplot, and line. You can use them together with `column_spec` to |
Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 6 | #' generate inline plot in tables. By default, this function will save images |
| 7 | #' in a folder called "kableExtra" and return the address of the file. |
| 8 | #' |
| 9 | #' @param x Vector of values or List of vectors of values. |
| 10 | #' @param width The width of the plot in pixel |
| 11 | #' @param height The height of the plot in pixel |
| 12 | #' @param res The resolution of the plot. Default is 300. |
| 13 | #' @param same_lim T/F. If x is a list of vectors, should all the plots be |
| 14 | #' plotted in the same range? Default is True. |
Hao Zhu | defd189 | 2020-09-09 00:08:09 -0400 | [diff] [blame] | 15 | #' @param lim Manually specify plotting range in the form of |
| 16 | #' `c(0, 10)`. |
Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 17 | #' @param xaxt On/Off for xaxis text |
| 18 | #' @param yaxt On/Off for yaxis text |
| 19 | #' @param ann On/Off for annotations (titles and axis titles) |
| 20 | #' @param col Color for the fill of the histogram bar/boxplot box. |
| 21 | #' @param border Color for the border. |
| 22 | #' @param dir Directory of where the images will be saved. |
| 23 | #' @param file File name. If not provided, a random name will be used |
| 24 | #' @param file_type Graphic device. Support `png` or `svg`. SVG is recommended |
| 25 | #' for HTML output |
Hao Zhu | defd189 | 2020-09-09 00:08:09 -0400 | [diff] [blame] | 26 | #' @param ... extra parameters sending to `hist()` |
Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 27 | #' |
Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 28 | #' @export |
| 29 | spec_hist <- function(x, width = 200, height = 50, res = 300, |
| 30 | breaks = "Sturges", |
| 31 | same_lim = TRUE, lim = NULL, |
| 32 | xaxt = 'n', yaxt = 'n', ann = FALSE, |
| 33 | col = "lightgray", border = NULL, |
| 34 | dir = if (is_latex()) rmd_files_dir() else tempdir(), |
| 35 | file = NULL, |
| 36 | file_type = if (is_latex()) "png" else "svg", ...) { |
| 37 | if (is.list(x)) { |
| 38 | if (same_lim & is.null(lim)) { |
| 39 | lim <- base::range(unlist(x)) |
| 40 | } |
| 41 | return(lapply(x, function(x_) {spec_hist( |
| 42 | x = x_, width = width, height = height, |
| 43 | breaks = breaks, same_lim = same_lim, lim = lim, |
| 44 | xaxt = xaxt, yaxt = yaxt, ann = ann, col = col, border = border, |
| 45 | dir = dir, file = file, file_type = file_type, ... |
| 46 | )})) |
| 47 | } |
| 48 | |
Bill Evans | 8def4da | 2020-09-11 09:58:26 -0700 | [diff] [blame] | 49 | if (is.null(x)) return(NULL) |
| 50 | |
Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 51 | if (is.null(lim)) { |
| 52 | lim <- base::range(x) |
| 53 | } |
| 54 | |
| 55 | file_type <- match.arg(file_type, c("svg", "png")) |
| 56 | |
| 57 | if (!dir.exists(dir)) { |
| 58 | dir.create(dir) |
| 59 | } |
| 60 | |
| 61 | if (is.null(file)) { |
Hao Zhu | cd9a581 | 2020-08-26 15:35:30 -0400 | [diff] [blame] | 62 | file <- file.path(dir, paste0( |
| 63 | "hist_", round(as.numeric(Sys.time()) * 1000), ".", file_type)) |
Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 64 | } |
| 65 | |
| 66 | if (file_type == "svg") { |
| 67 | grDevices::svg(filename = file, width = width / res, height = height / res, |
| 68 | bg = 'transparent') |
| 69 | } else { |
| 70 | grDevices::png(filename = file, width = width, height = height, res = res, |
| 71 | bg = 'transparent') |
| 72 | } |
| 73 | |
| 74 | graphics::par(mar = c(0, 0, 0.2, 0), lwd=0.5) |
| 75 | graphics::hist(x, breaks = breaks, xlim = lim, border = border, |
| 76 | xaxt = xaxt, yaxt = yaxt, ann = ann, col = col, ...) |
| 77 | grDevices::dev.off() |
| 78 | |
| 79 | if (file_type == "svg") { |
| 80 | svg_xml <- xml2::read_xml(file) |
| 81 | svg_text <- as.character(svg_xml) |
| 82 | unlink(file) |
| 83 | } else { |
| 84 | svg_text <- NULL |
| 85 | } |
| 86 | out <- list(path = file, dev = file_type, type = "hist", |
| 87 | width = width, height = height, res = res, |
| 88 | svg_text = svg_text) |
| 89 | |
| 90 | class(out) <- "kableExtraInlinePlots" |
| 91 | return(out) |
| 92 | } |
| 93 | |
Hao Zhu | defd189 | 2020-09-09 00:08:09 -0400 | [diff] [blame] | 94 | #' Helper functions to generate inline sparklines |
| 95 | #' |
| 96 | #' @description These functions helps you quickly generate sets of sparkline |
| 97 | #' style plots using base R plotting system. Currently, we support histogram, |
| 98 | #' boxplot, and line. You can use them together with `column_spec` to |
| 99 | #' generate inline plot in tables. By default, this function will save images |
| 100 | #' in a folder called "kableExtra" and return the address of the file. |
| 101 | #' |
| 102 | #' @param x Vector of values or List of vectors of values. |
| 103 | #' @param width The width of the plot in pixel |
| 104 | #' @param height The height of the plot in pixel |
| 105 | #' @param res The resolution of the plot. Default is 300. |
| 106 | #' @param add_label For boxplot. T/F to add labels for min, mean and max. |
| 107 | #' @param label_digits If T for add_label, rounding digits for the label. |
| 108 | #' Default is 2. |
| 109 | #' @param same_lim T/F. If x is a list of vectors, should all the plots be |
| 110 | #' plotted in the same range? Default is True. |
| 111 | #' @param lim,xlim,ylim Manually specify plotting range in the form of |
| 112 | #' `c(0, 10)`. `lim` is used in `spec_hist` and `spec_boxplot`; `xlim` |
| 113 | #' and `ylim` are used in `spec_line`. |
| 114 | #' @param xaxt On/Off for xaxis text |
| 115 | #' @param yaxt On/Off for yaxis text |
| 116 | #' @param ann On/Off for annotations (titles and axis titles) |
| 117 | #' @param col Color for the fill of the histogram bar/boxplot box. |
| 118 | #' @param border Color for the border. |
| 119 | #' @param boxlty Boxplot - box boarder type |
| 120 | #' @param medcol Boxplot - median line color |
| 121 | #' @param medlwd Boxplot - median line width |
| 122 | #' @param dir Directory of where the images will be saved. |
| 123 | #' @param file File name. If not provided, a random name will be used |
| 124 | #' @param file_type Graphic device. Support `png` or `svg`. SVG is recommended |
| 125 | #' for HTML output |
| 126 | #' @param ... extraparameters passing to boxplot |
| 127 | #' |
Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 128 | #' @export |
| 129 | spec_boxplot <- function(x, width = 200, height = 50, res = 300, |
| 130 | add_label = FALSE, label_digits = 2, |
| 131 | same_lim = TRUE, lim = NULL, |
| 132 | xaxt = 'n', yaxt = 'n', ann = FALSE, |
| 133 | col = "lightgray", border = NULL, |
| 134 | boxlty = 0, medcol = "red", medlwd = 1, |
| 135 | dir = if (is_latex()) rmd_files_dir() else tempdir(), |
| 136 | file = NULL, |
| 137 | file_type = if (is_latex()) "png" else "svg", ...) { |
| 138 | if (is.list(x)) { |
| 139 | if (same_lim & is.null(lim)) { |
| 140 | lim <- base::range(unlist(x)) |
| 141 | } |
| 142 | return(lapply(x, function(x_) {spec_boxplot( |
| 143 | x = x_, width = width, height = height, |
| 144 | add_label = add_label, same_lim = same_lim, lim = lim, |
| 145 | xaxt = xaxt, yaxt = yaxt, ann = ann, |
| 146 | col = col, border = border, |
| 147 | boxlty = boxlty, medcol = medcol, medlwd = medlwd, |
| 148 | dir = dir, file = file, file_type = file_type, ... |
| 149 | )})) |
| 150 | } |
| 151 | |
Bill Evans | 8def4da | 2020-09-11 09:58:26 -0700 | [diff] [blame] | 152 | if (is.null(x)) return(NULL) |
| 153 | |
Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 154 | if (is.null(lim)) { |
| 155 | lim <- base::range(x) |
| 156 | lim[1] <- lim[1] - (lim[2] - lim[1]) / 10 |
| 157 | lim[2] <- (lim[2] - lim[1]) / 10 + lim[2] |
| 158 | } |
| 159 | |
| 160 | file_type <- match.arg(file_type, c("svg", "png")) |
| 161 | |
| 162 | if (!dir.exists(dir)) { |
| 163 | dir.create(dir) |
| 164 | } |
| 165 | |
| 166 | if (is.null(file)) { |
Hao Zhu | cd9a581 | 2020-08-26 15:35:30 -0400 | [diff] [blame] | 167 | file <- file.path(dir, paste0( |
| 168 | "hist_", round(as.numeric(Sys.time()) * 1000), ".", file_type)) |
Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 169 | } |
| 170 | |
| 171 | if (file_type == "svg") { |
| 172 | grDevices::svg(filename = file, width = width / res, height = height / res, |
| 173 | bg = 'transparent') |
| 174 | } else { |
| 175 | grDevices::png(filename = file, width = width, height = height, res = res, |
| 176 | bg = 'transparent') |
| 177 | } |
| 178 | |
| 179 | graphics::par(mar = c(0, 0, 0, 0)) |
| 180 | |
| 181 | graphics::boxplot(x, horizontal = TRUE, ann = ann, frame = FALSE, bty = 'n', ylim = lim, |
| 182 | col = col, border = border, |
| 183 | boxlty = boxlty, medcol = medcol, medlwd = medlwd, |
| 184 | axes = FALSE, outcex = 0.2, whisklty = 1, |
| 185 | ...) |
| 186 | if (add_label) { |
| 187 | x_median <- round(median(x, na.rm = T), label_digits) |
| 188 | x_min <- round(min(x, na.rm = T), label_digits) |
| 189 | x_max <- round(max(x, na.rm = T), label_digits) |
| 190 | graphics::text(x_median, y = 1.4, labels = x_median, cex = 0.5) |
| 191 | graphics::text(x_min, y = 0.6, labels = x_min, cex = 0.5) |
| 192 | graphics::text(x_max, y = 0.6, labels = x_max, cex = 0.5) |
| 193 | } |
| 194 | grDevices::dev.off() |
| 195 | |
| 196 | if (file_type == "svg") { |
| 197 | svg_xml <- xml2::read_xml(file) |
| 198 | svg_text <- as.character(svg_xml) |
| 199 | unlink(file) |
| 200 | } else { |
| 201 | svg_text <- NULL |
| 202 | } |
| 203 | out <- list(path = file, dev = file_type, type = "boxplot", |
| 204 | width = width, height = height, res = res, |
| 205 | svg_text = svg_text) |
| 206 | class(out) <- "kableExtraInlinePlots" |
| 207 | return(out) |
| 208 | } |
| 209 | |
| 210 | is_latex <- knitr::is_latex_output |
| 211 | |
| 212 | rmd_files_dir <- function(create = TRUE) { |
| 213 | curr_file_name <- sub("\\.[^\\.]*$", "", knitr::current_input()) |
| 214 | dir_name <- paste0(curr_file_name, "_files") |
| 215 | if (!dir.exists(dir_name) & create) dir.create(dir_name) |
Hao Zhu | 7f3fa85 | 2020-08-26 13:55:38 -0400 | [diff] [blame] | 216 | fig_dir_name <- file.path(dir_name, "figure-latex/") |
Hao Zhu | 5fe235c | 2020-08-26 00:26:49 -0400 | [diff] [blame] | 217 | if (!dir.exists(fig_dir_name) & create) dir.create(fig_dir_name) |
| 218 | return(fig_dir_name) |
| 219 | } |
| 220 | |
Hao Zhu | defd189 | 2020-09-09 00:08:09 -0400 | [diff] [blame] | 221 | #' Helper functions to generate inline sparklines |
| 222 | #' |
| 223 | #' @description These functions helps you quickly generate sets of sparkline |
| 224 | #' style plots using base R plotting system. Currently, we support histogram, |
| 225 | #' boxplot, and line. You can use them together with `column_spec` to |
| 226 | #' generate inline plot in tables. By default, this function will save images |
| 227 | #' in a folder called "kableExtra" and return the address of the file. |
| 228 | #' |
| 229 | #' @param x,y Vector of values or List of vectors of values. y is optional. |
| 230 | #' @param width The width of the plot in pixel |
| 231 | #' @param height The height of the plot in pixel |
| 232 | #' @param res The resolution of the plot. Default is 300. |
| 233 | #' @param same_lim T/F. If x is a list of vectors, should all the plots be |
| 234 | #' plotted in the same range? Default is True. |
| 235 | #' @param xlim,ylim Manually specify plotting range in the form of |
| 236 | #' `c(0, 10)`. |
| 237 | #' @param xaxt On/Off for xaxis text |
| 238 | #' @param yaxt On/Off for yaxis text |
| 239 | #' @param ann On/Off for annotations (titles and axis titles) |
| 240 | #' @param col Color for the fill of the histogram bar/boxplot box. |
| 241 | #' @param border Color for the border. |
| 242 | #' @param frame.plot On/Off for surrounding box (`spec_line` only). Default |
| 243 | #' is False. |
| 244 | #' @param lwd Line width for `spec_line`; within `spec_line`, the `minmax` |
| 245 | #' argument defaults to use this value for `cex` for points. Default is 2. |
| 246 | #' @param minmax,min,max Arguments passed to `points` to highlight minimum |
| 247 | #' and maximum values in `spec_line`. If `min` or `max` are `NULL`, they |
| 248 | #' default to the value of `minmax`. Set to an empty `list()` to disable. |
| 249 | #' @param dir Directory of where the images will be saved. |
| 250 | #' @param file File name. If not provided, a random name will be used |
| 251 | #' @param file_type Graphic device. Support `png` or `svg`. SVG is recommended |
| 252 | #' for HTML output. |
| 253 | #' @param ... extra parameters passing to `plot` |
| 254 | #' |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 255 | #' @export |
| 256 | spec_line <- function(x, y = NULL, width = 200, height = 50, res = 300, |
| 257 | same_lim = TRUE, xlim = NULL, ylim = NULL, |
| 258 | xaxt = 'n', yaxt = 'n', ann = FALSE, |
| 259 | col = "lightgray", border = NULL, |
| 260 | frame.plot = FALSE, lwd = 2, |
| 261 | minmax = list(pch = ".", cex = lwd, col = "red"), |
| 262 | min = minmax, max = minmax, |
| 263 | dir = if (is_latex()) rmd_files_dir() else tempdir(), |
| 264 | file = NULL, |
| 265 | file_type = if (is_latex()) "png" else "svg", ...) { |
| 266 | if (is.list(x)) { |
Bill Evans | 60fd80b | 2020-09-11 10:40:25 -0700 | [diff] [blame^] | 267 | lenx <- length(x) |
| 268 | |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 269 | if (same_lim) { |
| 270 | if (is.null(xlim)) { |
Bill Evans | 60fd80b | 2020-09-11 10:40:25 -0700 | [diff] [blame^] | 271 | xlim <- lapply(x, base::range) |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 272 | } |
| 273 | if (is.null(ylim) && !is.null(y)) { |
Bill Evans | 60fd80b | 2020-09-11 10:40:25 -0700 | [diff] [blame^] | 274 | ylim <- lapply(y, base::range) |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 275 | } |
| 276 | } |
| 277 | if (is.null(y)) { |
Bill Evans | 60fd80b | 2020-09-11 10:40:25 -0700 | [diff] [blame^] | 278 | y <- replicate(lenx, NULL, simplify = FALSE) |
| 279 | } else if (!is.list(y) || lenx != length(y)) { |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 280 | stop("'x' and 'y' are not the same length") |
| 281 | } |
Bill Evans | 60fd80b | 2020-09-11 10:40:25 -0700 | [diff] [blame^] | 282 | |
| 283 | # any of the arguments can be per-plot controlling, but an arg |
| 284 | # that is normally not length-1 may be recycled (incorrectly) by |
| 285 | # Map, so we have to listify them if not already lists; |
| 286 | # enforce a restriction of recycling only length 1 or lenx |
| 287 | |
| 288 | # first, start with the literals (x,y) |
| 289 | # same_lim, not a factor anymore |
| 290 | dots <- list(x = x, y = y) |
| 291 | |
| 292 | # second, we know these args are likely to be vectors (length > 1) |
| 293 | # or lists, so we have to handle them carefully and double-list if |
| 294 | # present |
| 295 | notlen1 <- list(xlim = xlim, ylim = ylim, |
| 296 | minmax = minmax, min = min, max = max) |
| 297 | dots <- c(dots, Map( |
| 298 | function(L, nm) { |
| 299 | if (is.null(L)) return(list(NULL)) |
| 300 | if (!is.list(L) || !is.list(L[[1]])) return(list(L)) |
| 301 | if (!length(L) %in% c(1L, lenx)) { |
| 302 | stop("length of '", nm, "' must be 1 or the same length as 'x'") |
| 303 | } |
| 304 | L |
| 305 | }, notlen1, names(notlen1))) |
| 306 | |
| 307 | # last, all remaining arguments that we don't already know about |
| 308 | # are length-1, so can be easily listified; using 'formals()' |
| 309 | # allows us to not hard-code all params, for future expansion? |
| 310 | len1args <- mget(setdiff(names(formals()), |
| 311 | c(names(dots), "same_lim", "x", "y", "..."))) |
| 312 | dots <- c(dots, Map( |
| 313 | function(V, nm) { |
| 314 | if (is.null(V)) return(list(NULL)) |
| 315 | if (!length(V) %in% c(1L, lenx)) { |
| 316 | stop("length of '", nm, "' must be 1 or the same length as 'x'") |
| 317 | } |
| 318 | V |
| 319 | }, len1args, names(len1args))) |
| 320 | |
| 321 | return(do.call(Map, c(list(f = spec_line), dots))) |
| 322 | |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 323 | } |
| 324 | |
Bill Evans | 8def4da | 2020-09-11 09:58:26 -0700 | [diff] [blame] | 325 | if (is.null(x)) return(NULL) |
| 326 | |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 327 | if (is.null(y) || !length(y)) { |
| 328 | y <- x |
| 329 | x <- seq(0, 1, length.out = length(y)) |
| 330 | tmp <- ylim |
| 331 | ylim <- xlim |
| 332 | xlim <- tmp |
| 333 | } |
| 334 | |
| 335 | if (is.null(xlim)) { |
| 336 | xlim <- base::range(x) |
| 337 | } |
| 338 | |
| 339 | if (is.null(ylim) && !is.null(y)) { |
| 340 | ylim <- base::range(y) |
| 341 | } |
| 342 | |
| 343 | if (is.null(min)) min <- minmax |
| 344 | if (is.null(max)) max <- minmax |
| 345 | |
| 346 | expand <- c( |
Bill Evans | 60fd80b | 2020-09-11 10:40:25 -0700 | [diff] [blame^] | 347 | if (!is.null(min) && length(min)) -0.04 else 0, |
| 348 | if (!is.null(max) && length(max)) +0.04 else 0) |
| 349 | xlim <- xlim + diff(xlim) * expand |
| 350 | ylim <- ylim + diff(ylim) * expand |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 351 | |
| 352 | file_type <- match.arg(file_type, c("svg", "png")) |
| 353 | |
| 354 | if (!dir.exists(dir)) { |
| 355 | dir.create(dir) |
| 356 | } |
| 357 | |
| 358 | if (is.null(file)) { |
| 359 | file <- file.path(dir, paste0( |
| 360 | "hist_", round(as.numeric(Sys.time()) * 1000), ".", file_type)) |
| 361 | } |
| 362 | |
| 363 | if (file_type == "svg") { |
| 364 | grDevices::svg(filename = file, width = width / res, height = height / res, |
| 365 | bg = 'transparent') |
| 366 | } else { |
| 367 | grDevices::png(filename = file, width = width, height = height, res = res, |
| 368 | bg = 'transparent') |
| 369 | } |
| 370 | curdev <- grDevices::dev.cur() |
| 371 | on.exit(grDevices::dev.off(curdev), add = TRUE) |
| 372 | |
| 373 | graphics::par(mar = c(0, 0, 0.2, 0), lwd = lwd) |
Bill Evans | 60fd80b | 2020-09-11 10:40:25 -0700 | [diff] [blame^] | 374 | graphics::plot(x, y, type = "l", xlim = xlim, ylim = ylim, |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 375 | xaxt = xaxt, yaxt = yaxt, ann = ann, col = col, |
| 376 | frame.plot = frame.plot, ...) |
| 377 | |
| 378 | if (!is.null(min) && length(min)) { |
| 379 | ind <- which.min(y) |
Bill Evans | 60fd80b | 2020-09-11 10:40:25 -0700 | [diff] [blame^] | 380 | do.call(graphics::points, c(list(x[ind], y[ind], xpd = NA), min)) |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 381 | } |
| 382 | |
| 383 | if (!is.null(max) && length(max)) { |
| 384 | ind <- which.max(y) |
Bill Evans | 60fd80b | 2020-09-11 10:40:25 -0700 | [diff] [blame^] | 385 | do.call(graphics::points, c(list(x[ind], y[ind], xpd = NA), max)) |
Bill Evans | cebc971 | 2020-08-30 19:55:24 -0700 | [diff] [blame] | 386 | } |
| 387 | |
| 388 | grDevices::dev.off(curdev) |
| 389 | |
| 390 | if (file_type == "svg") { |
| 391 | svg_xml <- xml2::read_xml(file) |
| 392 | svg_text <- as.character(svg_xml) |
| 393 | unlink(file) |
| 394 | } else { |
| 395 | svg_text <- NULL |
| 396 | } |
| 397 | out <- list(path = file, dev = file_type, type = "line", |
| 398 | width = width, height = height, res = res, |
| 399 | svg_text = svg_text) |
| 400 | |
| 401 | class(out) <- "kableExtraInlinePlots" |
| 402 | return(out) |
| 403 | } |