, , , wordcloud tm.
, , , , , .
, wordcloud
Error in FUN(content(x), ...) : invalid input '...' in 'utf8towcs'
- :
# NOTE(review): these two lines look like alternatives (before/after), not
# consecutive steps. This one hands tolower to tm_map directly.
words.corpus <- tm_map(words.corpus, tolower)
# Same lower-casing, but wrapped in content_transformer(); presumably the form
# that keeps the corpus documents intact -- confirm against the tm docs.
words.corpus <- tm_map(words.corpus, content_transformer(tolower))
, , :
#' Draw a word cloud for a character vector and return the recorded plot.
#'
#' The corpus is built inside the function from `words`, so the result no
#' longer depends on a `words.corpus` object existing in the calling
#' environment.
#'
#' @param words Character vector of texts; each element becomes one document.
#' @param max_words Maximum number of words drawn (wordcloud's `max.words`).
#' @param remove_words Character vector of words to drop before plotting.
#'   Empty strings and `NA` entries are ignored.
#' @param n_colors Number of colours requested from the RColorBrewer palette.
#' @param palette Name of the RColorBrewer palette.
#' @return The plot recorded by `recordPlot()` after the cloud has been drawn.
plot_wordcloud <- function(words, max_words = 70, remove_words = "",
                           n_colors = 5, palette = "Set1") {
  # library() stops immediately when a package is missing; require() only
  # returned FALSE and let the function fail later with an unrelated error.
  library(tm)
  library(wordcloud)
  library(RColorBrewer)

  # Bring the text to UTF-8 without declaring it ASCII first: the previous
  # iconv(words, "ASCII", "UTF-8", sub = "byte") turned every non-ASCII
  # character into <xx> escapes. The UTF-8 -> UTF-8 pass only replaces byte
  # sequences that are not valid UTF-8, which are what trip 'utf8towcs'.
  words <- enc2utf8(as.character(words))
  words <- iconv(words, from = "UTF-8", to = "UTF-8", sub = "byte")
  words <- words[!is.na(words)]

  words_corpus <- Corpus(VectorSource(words))

  # Honour remove_words (it was accepted but never applied before).
  drop_words <- remove_words[!is.na(remove_words) & nzchar(remove_words)]
  if (length(drop_words) > 0) {
    words_corpus <- tm_map(words_corpus, removeWords, drop_words)
  }
  # content_transformer() keeps the documents as corpus documents instead of
  # replacing them with bare character vectors.
  words_corpus <- tm_map(words_corpus, content_transformer(tolower))

  wordcloud(
    words = words_corpus,
    max.words = max_words,
    random.order = FALSE,
    colors = brewer.pal(n_colors, palette),
    random.color = FALSE,
    scale = c(5.5, .5),
    rot.per = 0.35
  )
  # wordcloud() draws as a side effect; capture the current device contents.
  recordPlot()
}
:
# Build the tm corpus from the `words` vector via a VectorSource.
words.corpus <- Corpus(VectorSource(words))
:
UTF-8 :
# Convert every element to UTF-8 (bytes that cannot be converted are written
# as <xx> escapes), then mark the whole vector as UTF-8.
# vapply() always yields a character vector, also for empty input, and
# `Encoding<-` is vectorised, so no 1:length() loop is needed (that loop
# iterated over c(1, 0) and failed when `words` was empty).
words <- vapply(
  words,
  function(x) iconv(enc2utf8(x), sub = "byte"),
  character(1)
)
Encoding(words) <- "UTF-8"
:
UTF-8 :
# Drop the words listed in remove_words from every document.
words.corpus <- tm_map(words.corpus, removeWords, remove_words)
# Lower-case through stringi, wrapped in content_transformer().
words.corpus <- tm_map(words.corpus, content_transformer(stringi::stri_trans_tolower))
# NOTE(review): the three calls below pass plain functions to tm_map without
# content_transformer(), unlike the call above -- verify that the result is
# still a valid corpus. The last call also repeats the lower-casing.
words.corpus <- tm_map(words.corpus, function(x) iconv(x, to='UTF-8'))
words.corpus <- tm_map(words.corpus, enc2utf8)
words.corpus <- tm_map(words.corpus, tolower)
, , , . . , , , .
, :
# Declares the input as ASCII and converts it to UTF-8. With sub="byte", bytes
# that cannot be converted are written as <xx> hex escapes (per the iconv
# documentation), so non-ASCII text presumably does not survive as readable
# characters -- confirm on real input.
words <- iconv(words, "ASCII", "UTF-8", sub="byte")
:
:
http://www.textasdata.com/2015/02/encoding-headaches-emoticons-and-rs-handling-of-utf-816/