Examples for 'tm::DataframeSource'


Data Frame Source

Aliases: DataframeSource

Keywords:

### ** Examples

docs <- data.frame(doc_id = c("doc_1", "doc_2"),
                   text = c("This is a text.", "This another one."),
                   dmeta1 = 1:2, dmeta2 = letters[1:2],
                   stringsAsFactors = FALSE)
(ds <- DataframeSource(docs))
$encoding
[1] ""

$length
[1] 2

$position
[1] 0

$reader
function (elem, language, id) 
{
    PlainTextDocument(elem$content[, "text"], id = elem$content[, 
        "doc_id"], language = language)
}
<bytecode: 0x55ccfbdca640>
<environment: namespace:tm>

$content
  doc_id              text dmeta1 dmeta2
1  doc_1   This is a text.      1      a
2  doc_2 This another one.      2      b

attr(,"class")
[1] "DataframeSource" "SimpleSource"    "Source"         
x <- Corpus(ds)
inspect(x)
<<SimpleCorpus>>
Metadata:  corpus specific: 1, document level (indexed): 2
Content:  documents: 2

            doc_1             doc_2 
  This is a text. This another one. 
meta(x)
  dmeta1 dmeta2
1      1      a
2      2      b

[Package tm version 0.7-15 Index]