# Expects the first element of token_transcript()'s result to be the
# lower-cased word tokens of the input text, with punctuation and surrounding
# whitespace dropped.
# NOTE(review): the fixture string as it appears here contains no HTML markup
# even though the test is about tag removal -- confirm the tags were not lost
# when this file was copied or extracted.
test_that("html tags removed", {
  # The string literal deliberately spans two lines: the embedded newline is
  # part of the input under test.
  input_df <- data.frame(
    text = " The review . text with
a page break.tag without spaces. color "
  )

  expected_tokens <- c(
    "the", "review", "text", "with", "a", "page",
    "break", "tag", "without", "spaces", "color"
  )

  tokens <- token_transcript(input_df)

  expect_identical(tokens[[1]], expected_tokens)
})