# Build a masked word cloud from the scrubbed slide text.
#
# Steps: read the text file, split it into one word per row, drop SMART
# stop words, count word frequencies, save a copy of the text, and render
# the word cloud using a PNG mask.

library(tidyverse)
library(tidytext)
library(stopwords)
library(wordcloud2) # Install from Github required

# Note: Slide_text_scrubbed.txt is a cleaned variant of Slide_text.txt,
# generated by Slide_text_pull.py (in the Data folder).
text <- read_file("../../Data/Slide_text_scrubbed.txt")

# One row per token; unnest_tokens() writes the tokens to the `word` column.
df_doc <- data.frame(text = text, stringsAsFactors = FALSE) %>%
  unnest_tokens(word, text)

# Remove stop words (SMART list). The join key is given explicitly so the
# match column is unambiguous and no "Joining with ..." message is emitted.
stop_words_smart <- data.frame(
  word = stopwords(source = "smart"),
  stringsAsFactors = FALSE
)
df_doc <- df_doc %>%
  anti_join(stop_words_smart, by = "word")

# Frequency table with columns `word` and `freq`, most frequent first.
terms <- df_doc %>%
  count(word, sort = TRUE, name = "freq")

# Keep a copy of the scrubbed text one directory up.
write_file(text, "../text_scrubbed.txt")

# Draw the cloud from the computed frequencies (previously this plotted
# wordcloud2's bundled `demoFreq` example data, leaving `terms` unused).
wordcloud2(terms, figPath = "../Figures/END_mask.png")