r:document_classification
Differences
This shows you the differences between two versions of the page.
| Next revision | Previous revision | ||
| r:document_classification [2016/12/14 09:49] – created hkimscil | r:document_classification [2016/12/14 09:57] (current) – hkimscil | ||
|---|---|---|---|
| Line 1: | Line 1: | ||
| - | ====== | + | ====== |
| - | <code> | + | |
| - | > c <- tm_map(c, content_transformer(tolower)) | + | |
| - | > c <- tm_map(c, content_transformer(removeNumbers)) | + | |
| - | > c <- tm_map(c, content_transformer(removeNumbers)) | + | |
| - | > x <- TermDocumentMatrix(c) | + | |
| - | > inspect(x[1:10, 1:10]) | + | |
| - | <<TermDocumentMatrix (terms: 10, documents: 10)>> | + | |
| - | Non-/sparse entries: 7/93 | + | |
| - | Sparsity : 93% | + | |
| - | Maximal term length: 10 | + | |
| - | Weighting : term frequency (tf) | + | |
| - | Docs | ||
| - | Terms 127 144 191 194 211 236 237 242 246 248 | ||
| - | -/, 0 | ||
| - | -foot 0 | ||
| - | -hour 0 | ||
| - | -member | ||
| - | -nation | ||
| - | " | ||
| - | " | ||
| - | " | ||
| - | " | ||
| - | " | ||
| - | > c <- tm_map(c, content_transformer(removePunctuation)) | ||
| - | > x <- TermDocumentMatrix(c) | ||
| - | > inspect(x[1:10, 1:10]) | ||
| - | <<TermDocumentMatrix (terms: 10, documents: 10)>> | ||
| - | Non-/sparse entries: 13/87 | ||
| - | Sparsity : 87% | ||
| - | Maximal term length: 9 | ||
| - | Weighting : term frequency (tf) | ||
| - | |||
| - | Docs | ||
| - | Terms 127 144 191 194 211 236 237 242 246 248 | ||
| - | abdulaziz | ||
| - | ability | ||
| - | able 0 | ||
| - | about | ||
| - | above | ||
| - | abroad | ||
| - | accept | ||
| - | accord | ||
| - | according | ||
| - | across | ||
| - | > c <- crude | ||
| - | > c <- tm_map(c, content_transformer(tolower)) | ||
| - | > c <- tm_map(c, content_transformer(removePunctuation)) | ||
| - | > c <- tm_map(c, content_transformer(removeNumbers)) | ||
| - | > x <- TermDocumentMatrix(c) | ||
| - | > inspect(x[1:10, 1:10]) | ||
| - | <<TermDocumentMatrix (terms: 10, documents: 10)>> | ||
| - | Non-/sparse entries: 13/87 | ||
| - | Sparsity : 87% | ||
| - | Maximal term length: 9 | ||
| - | Weighting : term frequency (tf) | ||
| - | |||
| - | Docs | ||
| - | Terms 127 144 191 194 211 236 237 242 246 248 | ||
| - | abdulaziz | ||
| - | ability | ||
| - | able 0 | ||
| - | about | ||
| - | above | ||
| - | abroad | ||
| - | accept | ||
| - | accord | ||
| - | according | ||
| - | across | ||
| - | > | ||
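| - | > y <- TermDocumentMatrix(x, control = list(weighting = weightTfIdf)) | ||
| - | Error in UseMethod("TermDocumentMatrix", x) : | ||
| - | no applicable method for 'TermDocumentMatrix' applied to an object of class "c('TermDocumentMatrix', 'simple_triplet_matrix')" | ||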
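| - | > y <- TermDocumentMatrix(c, control = list(weighting = weightTfIdf)) | ||
| - | > inspect(y[1:10, 1:10]) | ||
| - | <<TermDocumentMatrix (terms: 10, documents: 10)>> | ||
| - | Non-/sparse entries: 13/87 | ||
| - | Sparsity : 87% | ||
| - | Maximal term length: 9 | ||
| - | Weighting : term frequency - inverse document frequency (normalized) (tf-idf) | ||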
| - | |||
| - | Docs | ||
| - | Terms | ||
| - | abdulaziz | ||
| - | ability | ||
| - | able 0 0.000000000 | ||
| - | about 0 0.003641675 | ||
| - | above 0 0.012792992 | ||
| - | abroad | ||
| - | accept | ||
| - | accord | ||
| - | according | ||
| - | across | ||
| - | Docs | ||
| - | Terms 237 242 246 248 | ||
| - | abdulaziz 0.00000000 | ||
| - | ability | ||
| - | able 0.00000000 | ||
| - | about | ||
| - | above | ||
| - | abroad | ||
| - | accept | ||
| - | accord | ||
| - | according 0.00000000 | ||
| - | across | ||
| - | > freqTerms <- findFreqTerms(x, | ||
| - | > freqTerms | ||
| - | [1] " | ||
| - | [5] " | ||
| - | [9] " | ||
| - | [13] " | ||
| - | [17] " | ||
| - | [21] " | ||
| - | [25] " | ||
| - | [29] " | ||
| - | [33] " | ||
| - | [37] " | ||
| - | [41] " | ||
| - | [45] " | ||
| - | > findAssocs(x, | ||
| - | $oil | ||
| - | | ||
| - | | ||
| - | who winter | ||
| - | | ||
| - | emergency | ||
| - | | ||
| - | through | ||
| - | | ||
| - | |||
| - | > | ||
| - | </code> | ||
r/document_classification.1481678347.txt.gz · Last modified: by hkimscil
