# blob: 09eea05e09aeecaf486a51d943092fdda8a678ee [file] [log] [blame]
#' Magic mirror that returns kable's attributes
#'
#' @description Mirror mirror tell me, what does this kable look like?
#'
#' @param kable_input The output of kable
#'
#' @return A list of table attributes. If `kable_input` carries a
#'   `kable_meta` attribute, that attribute is returned as is. Otherwise the
#'   list is built by parsing the table source according to its `format`
#'   attribute (`"latex"` or `"html"`); any other format is an error.
#'
#' @examples magic_mirror(knitr::kable(head(mtcars), "html"))
#' @export
magic_mirror <- function(kable_input){
  if (!inherits(kable_input, "knitr_kable")) {
    warning("magic_mirror may not be able to produce correct result if the",
            " input table is not rendered by knitr::kable. ")
  }
  # Metadata cached on the object takes precedence over re-parsing the source.
  if ("kable_meta" %in% names(attributes(kable_input))) {
    return(attr(kable_input, "kable_meta"))
  }
  kable_format <- attr(kable_input, "format")
  # Fail with a clear message instead of "argument is of length zero" when
  # the format attribute is missing or malformed.
  if (!is.character(kable_format) || length(kable_format) != 1L ||
      is.na(kable_format)) {
    stop("magic_mirror cannot find a valid `format` attribute on the input ",
         "table.", call. = FALSE)
  }
  # The unnamed last argument is the fallback for unsupported formats, which
  # previously surfaced as "object 'kable_info' not found".
  switch(
    kable_format,
    latex = magic_mirror_latex(kable_input),
    html = magic_mirror_html(kable_input),
    stop("magic_mirror only supports \"latex\" and \"html\" tables, not \"",
         kable_format, "\".", call. = FALSE)
  )
}
# Magic mirror for latex tables --------------
# Parses the LaTeX source of a kable with regular expressions and returns a
# list describing it: environment name, booktabs flag, alignment, vertical
# alignment option, number of columns/rows, caption(s), row contents, column
# and row names, plus a few derived helper fields.
#
# kable_input: the kable object holding the LaTeX source; its optional
#   "n_head" attribute is read to separate extra header rows from the body.
# Returns: the populated `kable_info` list.
magic_mirror_latex <- function(kable_input){
  kable_info <- list(tabular = NULL, booktabs = FALSE, align = NULL,
                     valign = NULL, ncol = NULL, nrow = NULL, colnames = NULL,
                     rownames = NULL, caption = NULL, caption.short = NULL,
                     contents = NULL,
                     centering = FALSE, table_env = FALSE)
  # Tabular: anything without \begin{tabular} is treated as a longtable.
  kable_info$tabular <- ifelse(
    grepl("\\\\begin\\{tabular\\}", kable_input),
    "tabular", "longtable"
  )
  # Booktabs
  kable_info$booktabs <- grepl("\\\\toprule", kable_input)
  # Align: the column specification in the last {...} on the \begin line,
  # with vertical bars removed.
  kable_info$align <- gsub("\\|", "", str_match(
    kable_input, paste0("\\\\begin\\{",
                        kable_info$tabular,"\\}.*\\{(.*?)\\}"))[2])
  kable_info$align_vector <- unlist(strsplit(kable_info$align, ""))
  kable_info$align_vector_origin <- kable_info$align_vector
  # valign: whatever sits between \begin{<env>} and the column specification
  # (e.g. a bracketed option).
  kable_info$valign <- gsub("\\|", "", str_match(
    kable_input, paste0("\\\\begin\\{", kable_info$tabular,"\\}(.*)\\{.*?\\}"))[2])
  # valign2: brackets escaped so the value can be embedded in a pattern.
  kable_info$valign2 <- sub("\\[", "\\\\[", kable_info$valign)
  kable_info$valign2 <- sub("\\]", "\\\\]", kable_info$valign2)
  # valign3: brackets removed.
  kable_info$valign3 <- sub("\\[", "", kable_info$valign)
  kable_info$valign3 <- sub("\\]", "", kable_info$valign3)
  # Escaped forms of the \begin{...}/\end{...} lines (these look like regex
  # patterns meant for later matching - confirm against callers).
  kable_info$begin_tabular <- paste0("\\\\begin\\{", kable_info$tabular, "\\}",
                                     kable_info$valign2)
  kable_info$end_tabular <- paste0("\\\\end\\{", kable_info$tabular, "\\}")
  # N of columns
  kable_info$ncol <- nchar(kable_info$align)
  # Caption
  if (str_detect(kable_input, "caption\\[")) {
    # \caption[short]{long...}: caption_line is everything after "\caption".
    caption_line <- str_match(kable_input, "\\\\caption(.*)\\n")[2]
    kable_info$caption.short <- str_match(caption_line, "\\[(.*?)\\]")[2]
    # Skip "[", the short caption, "]" and one more character (assumed to be
    # the opening "{" of the long caption).
    kable_info$caption <- substr(caption_line,
                                 nchar(kable_info$caption.short) + 4,
                                 nchar(caption_line))
  } else {
    kable_info$caption <- str_match(kable_input, "caption\\{(.*?)\\n")[2]
  }
  # Trim the trailing characters after the caption text: three for longtable
  # (presumably "}" plus a "\\" line break), one otherwise (presumably "}").
  if (kable_info$tabular == "longtable") {
    kable_info$caption <- str_sub(kable_info$caption, 1, -4)
  } else {
    kable_info$caption <- str_sub(kable_info$caption, 1, -2)
  }
  # Contents: every line that ends in "\\", without that terminator.
  kable_info$contents <- str_match_all(kable_input, "\n(.*)\\\\\\\\")[[1]][,2]
  kable_info$contents <- regex_escape(kable_info$contents, TRUE)
  # For a captioned longtable that is not wrapped in a table environment the
  # first matched line is dropped (presumably the caption line itself).
  if (kable_info$tabular == "longtable" && !is.na(kable_info$caption) &&
      !str_detect(kable_input, "\\\\begin\\{table\\}\\n\\n\\\\caption")) {
    kable_info$contents <- kable_info$contents[-1]
  }
  if (!is.null(attr(kable_input, "n_head"))) {
    n_head <- attr(kable_input, "n_head")
    # The first n_head - 1 content lines are extra header rows; they are
    # stored in reverse order and removed from the body contents.
    kable_info$new_header_row <- kable_info$contents[seq(n_head - 1, 1)]
    kable_info$contents <- kable_info$contents[-seq(1, n_head - 1)]
    kable_info$header_df <- extra_header_to_header_df(kable_info$new_header_row)
    kable_info$new_header_row <- paste0(kable_info$new_header_row, "\\\\\\\\")
  }
  kable_info$nrow <- length(kable_info$contents)
  kable_info$duplicated_rows <- any(duplicated(kable_info$contents))
  # Column names: a booktabs table without \midrule has no header row.
  if (kable_info$booktabs && !grepl("\\\\midrule", kable_input)) {
    kable_info$colnames <- NULL
    kable_info$position_offset <- 0
  } else {
    kable_info$colnames <- str_split(kable_info$contents[1], " \\& ")[[1]]
    kable_info$position_offset <- 1
  }
  # Row names: leading run of characters up to the first space or "&".
  kable_info$rownames <- str_extract(kable_info$contents, "^[^ &]*")
  kable_info$centering <- grepl("\\\\centering", kable_input)
  kable_info$table_env <- (!is.na(kable_info$caption) &&
                             kable_info$tabular != "longtable")
  kable_info
}
# Converts extra header rows into a list of data frames, one per row.
#
# extra_header_rows: character vector of header rows whose cells are
#   separated by " & ".
# Returns: a list with one data frame per row; each data frame has one line
#   per cell and the columns `header` and `colspan` produced by
#   extra_header_to_header_df_().
extra_header_to_header_df <- function(extra_header_rows) {
  lapply(str_split(extra_header_rows, " \\& "), function(cells) {
    # vapply() pins the per-cell result to a named character(2), so the
    # matrix shape does not depend on the input the way sapply()'s does.
    cell_info <- vapply(cells, extra_header_to_header_df_,
                        c(header = "", colspan = ""))
    as.data.frame(t(cell_info), row.names = NA)
  })
}
# Extracts the label and column span from a single header cell.
#
# x: one cell of an extra header row (a single string).
# Returns: a named character vector c(header = , colspan = ). A blank cell
#   yields header " " with colspan "1"; otherwise both values are taken from
#   the regex captures below and are NA when the pattern does not match.
extra_header_to_header_df_ <- function(x) {
  cell <- trimws(x)
  if (cell == "") {
    return(c(header = " ", colspan = "1"))
  }
  # Span: the text captured right after the leading escaped "\multicolumn{".
  span_match <- str_match(cell, "^\\\\\\\\multicolumn\\\\\\{([^\\\\\\}]*)")
  # Label: the brace-free text captured just before the final escaped "}".
  label_match <- str_match(cell, "([^\\}\\{]*)\\\\\\}$")
  c(header = label_match[2], colspan = span_match[2])
}
# Magic Mirror for html table --------
# Reads an HTML kable as XML and returns a list describing it.
#
# kable_input: the kable object holding the HTML source.
# Returns: a list with `caption`, `colnames` (trimmed text of the cells in
#   the last <thead> row), `ncol`, `nrow_header` (number of <thead> rows),
#   `nrow_body` (number of <tbody> rows), `table_class` and `table_style`
#   (the table's class/style attributes).
magic_mirror_html <- function(kable_input){
  kable_info <- list()
  kable_xml <- read_kable_as_xml(kable_input)
  # Caption
  kable_info$caption <- xml_text(xml_child(kable_xml, "caption"))
  # colnames: when several header rows exist, the last one holds the names.
  header_rows <- xml_children(xml_child(kable_xml, "thead"))
  header_cells <- lapply(header_rows, xml_children)
  kable_info$colnames <- header_cells[[length(header_cells)]]
  kable_info$colnames <- trimws(xml_text(kable_info$colnames))
  kable_info$ncol <- length(kable_info$colnames)
  kable_info$nrow_header <- length(header_rows)
  # Count body rows straight from <tbody>. This used to be
  # nrow(kable_info$contents), but `contents` is never populated, so the
  # value was NULL and the field was silently left out of the result.
  kable_info$nrow_body <- length(xml_children(xml_child(kable_xml, "tbody")))
  kable_info$table_class <- xml_attr(kable_xml, "class")
  kable_info$table_style <- xml_attr(kable_xml, "style")
  kable_info
}