├── .Rbuildignore ├── .gitignore ├── DESCRIPTION ├── LICENSE ├── NAMESPACE ├── R ├── compare.r ├── corpus.r ├── data.r ├── deprecation.r ├── lda.r └── tokens.r ├── README.md ├── corpus-tools.Rproj ├── data ├── demo_tokens_amcat.rdata ├── sotu.rda ├── wikinews_iraq.rda ├── wikinews_iraq_dtm_meta.rdata ├── wos_comsci_dtm.rdata └── wos_comsci_meta.rdata ├── howto ├── compare.Rmd ├── compare.html ├── compare.md ├── compare2.Rmd ├── compare_dev.Rmd ├── dtm.Rmd ├── dtm.html ├── dtm.md ├── figures_compare │ ├── unnamed-chunk-6-1.png │ ├── unnamed-chunk-6.png │ ├── unnamed-chunk-7-1.png │ └── unnamed-chunk-7.png ├── figures_dtm │ ├── unnamed-chunk-8-1.png │ └── unnamed-chunk-8.png ├── figures_lda │ ├── unnamed-chunk-7-1.png │ ├── unnamed-chunk-7-2.png │ ├── unnamed-chunk-71.png │ ├── unnamed-chunk-72.png │ ├── unnamed-chunk-8-1.png │ ├── unnamed-chunk-8-2.png │ ├── unnamed-chunk-81.png │ ├── unnamed-chunk-82.png │ ├── unnamed-chunk-9-1.png │ ├── unnamed-chunk-9-2.png │ ├── unnamed-chunk-91.png │ └── unnamed-chunk-92.png ├── howto_compare_corpora.md ├── lda.Rmd ├── lda.html └── lda.md ├── man ├── cast.sparse.matrix.Rd ├── chi2.Rd ├── corpora.compare.Rd ├── corpora.compare.list.Rd ├── create.index.Rd ├── documents.compare.Rd ├── documents.window.compare.Rd ├── documentsums.Rd ├── dtm.create.Rd ├── dtm.filter.Rd ├── dtm.to.df.Rd ├── dtm.to.dfm.Rd ├── dtm.wordcloud.Rd ├── dtmToSparseMatrix.Rd ├── fill.time.gaps.Rd ├── getOverlapTerms.Rd ├── lda.fit.Rd ├── lda.plot.alltopics.Rd ├── lda.plot.category.Rd ├── lda.plot.time.Rd ├── lda.plot.topic.Rd ├── lda.plot.wordcloud.Rd ├── ldavis_json.Rd ├── order.meta.Rd ├── plotWords.Rd ├── prepare.plot.values.Rd ├── prepare.time.var.Rd ├── sotu.Rd ├── splitDtm.Rd ├── term.statistics.Rd ├── term.time.statistics.Rd ├── topics.per.document.Rd └── wikinews_iraq.Rd └── runtopicmodel.r /.Rbuildignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/.Rbuildignore -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | .Rproj.user 2 | .Rhistory 3 | .RData 4 | -------------------------------------------------------------------------------- /DESCRIPTION: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/DESCRIPTION -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/LICENSE -------------------------------------------------------------------------------- /NAMESPACE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/NAMESPACE -------------------------------------------------------------------------------- /R/compare.r: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/R/compare.r -------------------------------------------------------------------------------- /R/corpus.r: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/R/corpus.r -------------------------------------------------------------------------------- /R/data.r: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/R/data.r -------------------------------------------------------------------------------- /R/deprecation.r: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/R/deprecation.r -------------------------------------------------------------------------------- /R/lda.r: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/R/lda.r -------------------------------------------------------------------------------- /R/tokens.r: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/README.md -------------------------------------------------------------------------------- /corpus-tools.Rproj: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/corpus-tools.Rproj -------------------------------------------------------------------------------- /data/demo_tokens_amcat.rdata: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/data/demo_tokens_amcat.rdata -------------------------------------------------------------------------------- /data/sotu.rda: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/data/sotu.rda -------------------------------------------------------------------------------- /data/wikinews_iraq.rda: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/data/wikinews_iraq.rda -------------------------------------------------------------------------------- /data/wikinews_iraq_dtm_meta.rdata: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/data/wikinews_iraq_dtm_meta.rdata -------------------------------------------------------------------------------- /data/wos_comsci_dtm.rdata: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/data/wos_comsci_dtm.rdata -------------------------------------------------------------------------------- /data/wos_comsci_meta.rdata: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/data/wos_comsci_meta.rdata -------------------------------------------------------------------------------- /howto/compare.Rmd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/compare.Rmd -------------------------------------------------------------------------------- /howto/compare.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/compare.html -------------------------------------------------------------------------------- /howto/compare.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/compare.md -------------------------------------------------------------------------------- /howto/compare2.Rmd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/compare2.Rmd -------------------------------------------------------------------------------- /howto/compare_dev.Rmd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/compare_dev.Rmd -------------------------------------------------------------------------------- /howto/dtm.Rmd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/dtm.Rmd -------------------------------------------------------------------------------- /howto/dtm.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/dtm.html -------------------------------------------------------------------------------- /howto/dtm.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/dtm.md -------------------------------------------------------------------------------- /howto/figures_compare/unnamed-chunk-6-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_compare/unnamed-chunk-6-1.png -------------------------------------------------------------------------------- /howto/figures_compare/unnamed-chunk-6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_compare/unnamed-chunk-6.png -------------------------------------------------------------------------------- /howto/figures_compare/unnamed-chunk-7-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_compare/unnamed-chunk-7-1.png -------------------------------------------------------------------------------- /howto/figures_compare/unnamed-chunk-7.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_compare/unnamed-chunk-7.png -------------------------------------------------------------------------------- /howto/figures_dtm/unnamed-chunk-8-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_dtm/unnamed-chunk-8-1.png -------------------------------------------------------------------------------- /howto/figures_dtm/unnamed-chunk-8.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_dtm/unnamed-chunk-8.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-7-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-7-1.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-7-2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-7-2.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-71.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-71.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-72.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-72.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-8-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-8-1.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-8-2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-8-2.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-81.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-81.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-82.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-82.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-9-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-9-1.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-9-2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-9-2.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-91.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-91.png -------------------------------------------------------------------------------- /howto/figures_lda/unnamed-chunk-92.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/figures_lda/unnamed-chunk-92.png -------------------------------------------------------------------------------- /howto/howto_compare_corpora.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/howto_compare_corpora.md -------------------------------------------------------------------------------- /howto/lda.Rmd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/lda.Rmd -------------------------------------------------------------------------------- /howto/lda.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/lda.html -------------------------------------------------------------------------------- /howto/lda.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/howto/lda.md -------------------------------------------------------------------------------- /man/cast.sparse.matrix.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/cast.sparse.matrix.Rd -------------------------------------------------------------------------------- /man/chi2.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/chi2.Rd -------------------------------------------------------------------------------- /man/corpora.compare.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/corpora.compare.Rd -------------------------------------------------------------------------------- /man/corpora.compare.list.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/corpora.compare.list.Rd -------------------------------------------------------------------------------- /man/create.index.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/create.index.Rd -------------------------------------------------------------------------------- /man/documents.compare.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/documents.compare.Rd -------------------------------------------------------------------------------- /man/documents.window.compare.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/documents.window.compare.Rd -------------------------------------------------------------------------------- /man/documentsums.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/documentsums.Rd -------------------------------------------------------------------------------- /man/dtm.create.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/dtm.create.Rd -------------------------------------------------------------------------------- /man/dtm.filter.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/dtm.filter.Rd -------------------------------------------------------------------------------- /man/dtm.to.df.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/dtm.to.df.Rd -------------------------------------------------------------------------------- /man/dtm.to.dfm.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/dtm.to.dfm.Rd -------------------------------------------------------------------------------- /man/dtm.wordcloud.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/dtm.wordcloud.Rd -------------------------------------------------------------------------------- /man/dtmToSparseMatrix.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/dtmToSparseMatrix.Rd -------------------------------------------------------------------------------- /man/fill.time.gaps.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/fill.time.gaps.Rd -------------------------------------------------------------------------------- /man/getOverlapTerms.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/getOverlapTerms.Rd -------------------------------------------------------------------------------- /man/lda.fit.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/lda.fit.Rd -------------------------------------------------------------------------------- /man/lda.plot.alltopics.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/lda.plot.alltopics.Rd -------------------------------------------------------------------------------- /man/lda.plot.category.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/lda.plot.category.Rd -------------------------------------------------------------------------------- /man/lda.plot.time.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/lda.plot.time.Rd -------------------------------------------------------------------------------- /man/lda.plot.topic.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/lda.plot.topic.Rd -------------------------------------------------------------------------------- /man/lda.plot.wordcloud.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/lda.plot.wordcloud.Rd -------------------------------------------------------------------------------- /man/ldavis_json.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/ldavis_json.Rd -------------------------------------------------------------------------------- /man/order.meta.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/order.meta.Rd -------------------------------------------------------------------------------- /man/plotWords.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/plotWords.Rd -------------------------------------------------------------------------------- /man/prepare.plot.values.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/prepare.plot.values.Rd -------------------------------------------------------------------------------- /man/prepare.time.var.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/prepare.time.var.Rd -------------------------------------------------------------------------------- /man/sotu.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/sotu.Rd -------------------------------------------------------------------------------- /man/splitDtm.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/splitDtm.Rd -------------------------------------------------------------------------------- /man/term.statistics.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/term.statistics.Rd -------------------------------------------------------------------------------- /man/term.time.statistics.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/term.time.statistics.Rd -------------------------------------------------------------------------------- /man/topics.per.document.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/topics.per.document.Rd -------------------------------------------------------------------------------- /man/wikinews_iraq.Rd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/man/wikinews_iraq.Rd -------------------------------------------------------------------------------- /runtopicmodel.r: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kasperwelbers/corpus-tools/HEAD/runtopicmodel.r --------------------------------------------------------------------------------