File: comparison.cloud.Rd

package info (click to toggle)
r-cran-wordcloud 2.6-2
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, bullseye, forky, sid, trixie
  • size: 168 kB
  • sloc: cpp: 30; makefile: 2
file content (62 lines) | stat: -rw-r--r-- 2,564 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
\name{comparison.cloud}
\alias{comparison.cloud}
\title{
  Plot a comparison cloud
}
\description{
  Plot a cloud comparing the frequencies of words across documents.
}
\usage{
comparison.cloud(term.matrix,scale=c(4,.5), max.words=300,
	random.order=FALSE, rot.per=.1,
	colors=brewer.pal(max(3,ncol(term.matrix)),"Dark2"),
	use.r.layout=FALSE, title.size=3,
	title.colors=NULL, match.colors=FALSE,
	title.bg.colors="grey90", ...)
}
\arguments{
  \item{term.matrix}{A term frequency matrix whose rows represent words and whose columns represent documents.}
  \item{scale}{A vector of length 2 indicating the range of the size of the words. }
  \item{max.words}{Maximum number of words to be plotted. The least frequent terms are dropped.}
  \item{random.order}{Plot words in random order. If \code{FALSE}, they will be plotted in decreasing order of frequency.}
  \item{rot.per}{Proportion of words with 90 degree rotation.}
  \item{colors}{Colors for the words, in the order of the columns of \code{term.matrix}.}
  \item{use.r.layout}{If \code{FALSE}, C++ code is used for collision detection; otherwise R is used.}
  \item{title.size}{Size of document titles}
  \item{title.colors}{Colors used for document titles. See details.}
  \item{match.colors}{Logical: should document title colors match word colors? See details.}
  \item{title.bg.colors}{Colors used for the background of document titles.}
  \item{...}{Additional parameters to be passed to \code{text} (and \code{strheight}, \code{strwidth}).}
}
\details{
Let \eqn{p_{i,j}} be the rate at which word i occurs in document j, and \eqn{p_i} be its
average rate across documents (\eqn{\sum_j p_{i,j}/ndocs}). The size of each word is mapped to its maximum deviation
(\eqn{max_j(p_{i,j}-p_i)}), and its angular position is determined by the document where that maximum occurs.

If \code{title.colors} is not \code{NULL}, it is used for document titles and \code{match.colors} is ignored.
}
\value{
nothing
 }
\examples{

if(require(tm)){
	data(SOTU)
	corp <- SOTU
	corp <- tm_map(corp, removePunctuation)
	corp <- tm_map(corp, content_transformer(tolower))
	corp <- tm_map(corp, removeNumbers)
	corp <- tm_map(corp, function(x)removeWords(x,stopwords()))

	term.matrix <- TermDocumentMatrix(corp)
	term.matrix <- as.matrix(term.matrix)
	colnames(term.matrix) <- c("SOTU 2010","SOTU 2011")
	comparison.cloud(term.matrix,max.words=40,random.order=FALSE)
	comparison.cloud(term.matrix,max.words=40,random.order=FALSE,
		title.colors=c("red","blue"),title.bg.colors=c("grey40","grey70"))
	comparison.cloud(term.matrix,max.words=40,random.order=FALSE,
		match.colors=TRUE)

}

}