Count words, n-grams, shingles

⚠️ THIS IS A WORK IN PROGRESS
library(stringr)
# Count how often each word occurs within each document: one row per
# (url, word) pair with its frequency in column `n`. Stop words and any
# token containing a digit are removed before counting.
# NOTE(review): relies on `all_full_txt` (built elsewhere) having a `url`
# column and a text column named `txt` — confirm against its definition.
top_words <- all_full_txt %>%
  unnest_tokens(word, txt) %>%
  # Name the join key explicitly so the join cannot silently match on any
  # other column the two tables happen to share.
  anti_join(get_stopwords(), by = "word") %>%
  filter(!str_detect(word, "[0-9]+")) %>%
  # Counting by (url, word) yields the same per-url tallies as
  # group_by(url) + count(word), but the result comes back ungrouped.
  count(url, word, sort = FALSE)

# View() returns NULL invisibly, so it must not terminate the assigned
# pipeline (that would store NULL in `top_words`). Inspect the stored
# result as a separate, interactive-only step instead.
View(top_words)