# tests/testthat/test-dolphins.R
# NOTE(review): the path above says "dolphins", but this test exercises the
# word_adjacencies.gml dataset -- confirm the intended file name.

library(testthat)
library(arlclustering)
#library(igraph)
library(arules)
library(microbenchmark)
library(ggplot2)

# End-to-end run of the arlclustering pipeline on the word adjacency network.
# Each step is wrapped in microbenchmark(times = 1) so its wall-clock time is
# recorded; the assignments inside the microbenchmark() calls are evaluated in
# the calling environment, so the results stay available to later steps.
test_that("Word Adjacency Network Analysis", {
  # Define the path to the dataset
  dataset_path <- system.file(
    "extdata", "word_adjacencies.gml",
    package = "arlclustering"
  )
  if (dataset_path == "") {
    stop("word_adjacencies.gml file not found in the package")
  }

  # Ensure the file exists
  expect_true(file.exists(dataset_path))

  timings <- list()

  # Load the network dataset
  timings[["Load Network"]] <- microbenchmark(
    g <- arlc_get_network_dataset(dataset_path, "Word Adjacencies"),
    times = 1
  )

  # Ensure the dataset is loaded correctly
  expect_false(is.null(g))
  expect_true("graph" %in% names(g))
  expect_true("graphLabel" %in% names(g))

  # Generate transactions from the graph
  timings[["Generate Transactions"]] <- microbenchmark(
    transactions <- arlc_gen_transactions(g$graph),
    times = 1
  )
  expect_false(is.null(transactions))
  expect_s4_class(transactions, "transactions")

  # Get apriori thresholds
  timings[["Get Apriori Thresholds"]] <- microbenchmark(
    params <- arlc_get_apriori_thresholds(
      transactions,
      supportRange = seq(0.05, 0.06, by = 0.01),
      0.5
    ),
    times = 1
  )
  expect_false(is.null(params))
  expect_true("minSupp" %in% names(params))
  expect_true("minConf" %in% names(params))
  expect_true("lenRules" %in% names(params))

  # Generate gross rules
  timings[["Generate Gross Rules"]] <- microbenchmark(
    grossRules <- arlc_gen_gross_rules(
      transactions,
      minSupp = params$minSupp,
      minConf = params$minConf,
      minLenRules = 2,
      maxLenRules = params$lenRules
    ),
    times = 1
  )
  expect_false(is.null(grossRules$GrossRules))
  expect_true("GrossRules" %in% names(grossRules))

  # Get non-redundant rules
  timings[["Filter gross from redundant rules"]] <- microbenchmark(
    NonRedRules <- arlc_get_NonR_rules(grossRules$GrossRules),
    times = 1
  )
  expect_false(is.null(NonRedRules$FiltredRules))
  expect_true("FiltredRules" %in% names(NonRedRules))

  # Get significant non-redundant rules
  timings[["Filter redundant from non-significant rules"]] <- microbenchmark(
    NonRSigRules <- arlc_get_significant_rules(
      transactions,
      NonRedRules$FiltredRules
    ),
    times = 1
  )
  expect_false(is.null(NonRSigRules$FiltredRules))
  expect_true("FiltredRules" %in% names(NonRSigRules))

  # Clean final rules
  timings[["Clean Final Rules"]] <- microbenchmark(
    cleanedRules <- arlc_clean_final_rules(NonRSigRules$FiltredRules),
    times = 1
  )
  expect_false(is.null(cleanedRules))

  # Generate clusters (named `clusters` to avoid shadowing base::c)
  timings[["Generate Clusters"]] <- microbenchmark(
    clusters <- arlc_generate_clusters(cleanedRules),
    times = 1
  )
  expect_false(is.null(clusters))
  expect_true("Clusters" %in% names(clusters))

  # Plot clusters (named `cluster_plot` to avoid shadowing graphics::plot)
  timings[["Plot Clusters"]] <- microbenchmark(
    cluster_plot <- arlc_clusters_plot(
      g$graph, g$graphLabel, clusters$Clusters
    ),
    times = 1
  )
  #expect_true(!is.null(cluster_plot))

  # Combine timings into a data frame for plotting.
  # The raw `time` column of a microbenchmark object is in nanoseconds, so
  # dividing by 1e6 yields milliseconds. summary() must not be used here: it
  # rescales each result to an automatically chosen unit, which would make the
  # fixed 1e6 divisor wrong and the steps incomparable.
  timing_data <- data.frame(
    Step = names(timings),
    Time = vapply(
      timings,
      function(timing) mean(timing$time) / 1e6,
      numeric(1)
    ),
    row.names = NULL
  )
  expect_equal(nrow(timing_data), length(timings))
  expect_true(all(is.finite(timing_data$Time)))

  # Plot the timing data
  ggplot(timing_data, aes(x = Step, y = Time)) +
    geom_bar(stat = "identity") +
    labs(
      title = "Execution Time of Steps in Word Adjacencies Network Analysis",
      x = "Step",
      y = "Time (ms)"
    ) +
    theme(axis.text.x = element_text(angle = 45, hjust = 1))
})