1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62
|
\name{comparison.cloud}
\alias{comparison.cloud}
\title{
Plot a comparison cloud
}
\description{
Plot a cloud comparing the frequencies of words across documents.
}
\usage{
comparison.cloud(term.matrix,scale=c(4,.5), max.words=300,
random.order=FALSE, rot.per=.1,
colors=brewer.pal(max(3,ncol(term.matrix)),"Dark2"),
use.r.layout=FALSE, title.size=3,
title.colors=NULL, match.colors=FALSE,
title.bg.colors="grey90", ...)
}
\arguments{
\item{term.matrix}{A term frequency matrix whose rows represent words and whose columns represent documents.}
\item{scale}{A vector of length 2 indicating the range of the size of the words. }
\item{max.words}{Maximum number of words to be plotted. least frequent terms dropped}
\item{random.order}{plot words in random order. If false, they will be plotted in decreasing frequency}
\item{rot.per}{proportion words with 90 degree rotation}
\item{colors}{Color words in the order of columns in \code{term.matrix}}
\item{use.r.layout}{if false, then c++ code is used for collision detection, otherwise R is used}
\item{title.size}{Size of document titles}
\item{title.colors}{Colors used for document titles. See details.}
\item{match.colors}{Logical: should colors document titles colors match word colors? See details.}
\item{title.bg.colors}{Colors used for the background of document titles.}
\item{...}{Additional parameters to be passed to text (and strheight,strwidth).}
}
\details{
Let \eqn{p_{i,j}} be the rate at which word i occurs in document j, and \eqn{p_j} be the
average across documents(\eqn{\sum_ip_{i,j}/ndocs}). The size of each word is mapped to its maximum deviation
( \eqn{max_i(p_{i,j}-p_j)} ), and its angular position is determined by the document where that maximum occurs.
If \code{title.colors} is not \code{NULL}, it is used for document titles and \code{match.colors} is ignored.
}
\value{
nothing
}
\examples{
if(require(tm)){
data(SOTU)
corp <- SOTU
corp <- tm_map(corp, removePunctuation)
corp <- tm_map(corp, content_transformer(tolower))
corp <- tm_map(corp, removeNumbers)
corp <- tm_map(corp, function(x)removeWords(x,stopwords()))
term.matrix <- TermDocumentMatrix(corp)
term.matrix <- as.matrix(term.matrix)
colnames(term.matrix) <- c("SOTU 2010","SOTU 2011")
comparison.cloud(term.matrix,max.words=40,random.order=FALSE)
comparison.cloud(term.matrix,max.words=40,random.order=FALSE,
title.colors=c("red","blue"),title.bg.colors=c("grey40","grey70"))
comparison.cloud(term.matrix,max.words=40,random.order=FALSE,
match.colors=TRUE)
}
}
|