library(kwb.matomo)

# Helpers ----------------------------------------------------------------------

# Regular expression marking a URL/path as a "file": it ends in "/index",
# carries a query string ("?..."), or ends in "htm", "html" or "pdf".
# Everything else is treated as a "directory".
file_url_pattern <- "/index$|\\?.*$|htm$|html$|pdf$"

#' Classify URLs or paths as "file" or "directory"
#'
#' @param x Character vector of URLs or paths.
#' @return Character vector of the same length as `x` containing "file" for
#'   elements matching `file_url_pattern` and "directory" otherwise.
classify_page_url <- function(x) {
  ifelse(grepl(pattern = file_url_pattern, x), "file", "directory")
}

#' Reformat page URL statistics into a path/type/size table
#'
#' Drops rows without a URL, keeps the columns `url` and `nb_visits` (renamed
#' to `path` and `size`), strips a leading "https://" or "http://" and a
#' leading "www." from the path, classifies each path as "file" or
#' "directory", replaces missing sizes with 0 and sums the sizes per
#' path/type combination.
#'
#' @param page_urls Data frame with (at least) the columns `url` and
#'   `nb_visits`.
#' @return Ungrouped tibble with the columns `path`, `type` and `size`
#'   (in that order), one row per path/type combination.
reformat_pageurls_info <- function (page_urls) {

  # as_tibble() replaces the deprecated as_data_frame()
  file_info <- dplyr::as_tibble(page_urls[!is.na(page_urls$url), ])

  # Columns are addressed by name (strings): using the .data pronoun inside
  # select()/rename() is deprecated in tidyselect
  file_info <- dplyr::select(file_info, "url", "nb_visits")
  file_info <- dplyr::rename(file_info, path = "url", size = "nb_visits")

  # Remove the protocol first, then a leading "www."
  file_info$path <- stringr::str_remove(
    file_info$path, pattern = "^https://|^http://"
  )
  file_info$path <- stringr::str_remove(file_info$path, pattern = "^www\\.")

  file_info$type <- classify_page_url(file_info$path)
  file_info$size <- kwb.utils::defaultIfNA(file_info$size, 0)

  # Aggregate per path/type. The calls are deliberately not piped so that the
  # function does not depend on `%>%` being attached by some other package.
  file_info <- dplyr::group_by(file_info, .data$path, .data$type)
  file_info <- dplyr::summarise(file_info, size = sum(.data$size))

  # summarise() only peels off the last grouping level; drop the rest so that
  # callers do not receive an unexpectedly grouped table
  file_info <- dplyr::ungroup(file_info)

  kwb.utils::moveColumnsToFront(file_info, c("path", "type", "size"))
}

#' Reformat page URL statistics and attach unit metadata
#'
#' @param page_urls Data frame as accepted by `reformat_pageurls_info()`.
#' @return Result of `reformat_pageurls_info()` with an attribute `units`
#'   set to `list(size = "Number of visits")`.
normalise_pageurls_info <- function (page_urls) {

  file_info <- kwb.utils::catAndRun("Reformatting the file info table", {
    reformat_pageurls_info(page_urls)
  })

  structure(file_info, units = list(size = "Number of visits"))
}

# Script -----------------------------------------------------------------------

page_urls <- kwb.matomo::get_pageurls()
page_urls$type <- classify_page_url(page_urls$url)

# Network plot of the pages classified as "directory"
paths <- page_urls[page_urls$type == "directory", ]

# NOTE(review): `size` is passed as a bare symbol but is never defined in this
# script. Unless plot_path_network() captures the argument unevaluated, this
# fails with "object 'size' not found"; presumably "size" (a string) is meant.
# Confirm against the fakin.path.app documentation.
fakin.path.app::plot_path_network(
  paths = paths$label,
  remove_common_root = FALSE,
  max_depth = 3,
  weight_by = size,
  sizes = paths$sum_time_spent
)

# Treemaps of the aggregated number of visits per path
fakin.path.app::plot_treemaps_from_path_data(
  path_data = normalise_pageurls_info(page_urls),
  root_path = "kompetenz-wasser.de/",
  n_levels = 2
)