# Checks that token_transcript() returns, as its first element, the
# lower-cased word tokens of the fixture text in their original order.
# NOTE(review): the fixture below shows no literal HTML tags even though the
# test name mentions them -- confirm the markup was not lost from the string.
test_that("html tags removed", {
  # The literal spans two lines; keep the continuation at column 0 so the
  # string contents stay exactly as they are.
  raw_text <- " The review . text with
a page break.tag without spaces. color "
  transcript_df <- data.frame(text = raw_text)

  expected_tokens <- c(
    "the", "review", "text", "with", "a", "page", "break",
    "tag", "without", "spaces", "color"
  )

  tokenised <- token_transcript(transcript_df)
  expect_identical(tokenised[[1]], expected_tokens)
})