# Text-preprocessing script: load article metadata, build a corpus from the
# titles, and produce stemmed tokens with English stopwords removed.
# NOTE(review): assumes the packages providing read_csv(), corpus(),
# stopwords(), tokens(), tokens_remove(), tokens_wordstem() and %>% are
# already attached earlier in the file -- confirm.

# Read the CSV ----
articletexts <- read_csv("Meta.csv")
summary(articletexts)

# Create a corpus ----
# The "title" column supplies the text of each document.
corp <- corpus(articletexts, text_field = "title")
corp

# Stopwords ----
sw <- stopwords("english")
sw

# Tokenize and remove elements ----
# Punctuation, numbers and symbols are dropped while tokenizing; the stopwords
# in `sw` are removed next, and the remaining tokens are stemmed last.
# TRUE is spelled out because T is an ordinary, reassignable variable.
# NOTE(review): the result shares its name with the tokens() function. R still
# resolves the function when the name is used in call position, but a distinct
# variable name would be clearer if no other code depends on this one.
tokens <- tokens(
  corp,
  remove_punct = TRUE,
  remove_numbers = TRUE,
  remove_symbols = TRUE
) %>%
  tokens_remove(sw) %>%
  tokens_wordstem()
I have tried gsub to remove all letters of the English alphabet.
var
This content, along with any associated source code and files, is licensed under The Code Project Open License (CPOL)