## File: cleannlp.R
##
## package info (click to toggle)
##
## r-cran-nlp 0.3-2-1
##
## links: PTS, VCS
## area: main
## in suites: forky, sid, trixie
## size: 456 kB
## sloc: makefile: 2
##
## file content (61 lines) | stat: -rw-r--r-- 1,328 bytes
##
## parent folder | download | duplicates (2)

## Viewer methods for objects of class "cnlp_annotation" as obtained by
## cleanNLP::cnlp_annotate().

words.cnlp_annotation <-
function(x, ...)
{
    x$token$token
}

sents.cnlp_annotation <-
function(x, ...)
{
    x <- x$token
    split(x$token, x$sid)
}

## paras.cnlp_annotation <-
## function(x, ...)
## {
##     x <- x$token
##     if(is.na(match("pid", names(x))))
##         stop("unavailable paragraph ids")
##     lapply(split(x, x$pid),
##            function(e) split(e$token, e$sid))
## }

tagged_words.cnlp_annotation <-
function(x, which = c("upos", "pos"), ...)
{
    x <- x$token
    which <- match.arg(which)
    Tagged_Token(x$token, x[[which]])
}

tagged_sents.cnlp_annotation <-
function(x, which = c("upos", "pos"), ...)
{
    x <- x$token
    which <- match.arg(which)
    .tagged_sents_from_cnlp_token_frame(x, which)
}

.tagged_sents_from_cnlp_token_frame <-
function(x, which)
{
    lapply(split(x, x$sid),
           function(e) Tagged_Token(e$token, e[[which]]))
}

## tagged_paras.cnlp_annotation <-
## function(x, which = c("upos", "pos"), ...)
## {
##     x <- x$token
##     if(is.na(match("pid", names(x))))
##         stop("unavailable paragraph ids")
##     which <- match.arg(which)
##     lapply(split(x, x$pid),
##            .tagged_sents_from_cnlp_token_frame,
##            which)
## }