--
You received this message because you are subscribed to the Google Groups "computationalstylistics" group.
To unsubscribe from this group and stop receiving emails from it, send an email to computationalstylistics+unsub...@googlegroups.com.
Visit this group at https://groups.google.com/group/computationalstylistics.
For more options, visit https://groups.google.com/d/optout.
To unsubscribe from this group and stop receiving emails from it, send an email to computationalstylistics+unsubscr...@googlegroups.com.
# Each file in the corpus is expected to contain one trigram per line, as shown below.
# This assumes the trigrams already respect the desired boundaries.
Thi
his
is
s i
is
is
s a
a
a t
te
tes
est
st.
# Load every text from the "corpus" subdirectory; only the element names
# of the result are used below (see help(load.corpus) for the options).
raw_texts <- load.corpus(files = "all", corpus.dir = "corpus")
text_names <- names(raw_texts)
# Re-read each file line by line, so that every line of a file becomes
# one token of the corresponding text.
# (To read from another directory, e.g. 'corpus_ngramified/', change the
# path prefix passed to paste0() below.)
tokenized_texts <- lapply(text_names, function(text_name) {
  readLines(paste0("corpus/", text_name))
})
# Label each tokenized text with the name of the text it came from.
names(tokenized_texts) <- text_names
# Run `stylo` on the pre-tokenized corpus instead of letting it parse files.
x <- stylo(parsed.corpus = tokenized_texts)
# Attach the stylo package so that stylo() can be called below.
library(stylo)
# Variant 1: pass an existing object through the `frequencies` argument.
# NOTE(review): table_with_frequencies is not defined in this snippet; it
# must already exist in the workspace.
stylo(frequencies = table_with_frequencies)
# Variant 2: pass an existing object through the `parsed.corpus` argument.
# NOTE(review): the_corpus is not defined in this snippet; it must already
# exist in the workspace.
stylo(parsed.corpus = the_corpus)
sample 5
"tib_carm_3"
[1] i m
[2] m a
[3] m a r
[4] a r t
[5] r t i
[6] t i s
[7] i s
[8] s r
[9] r o
[10] r o m
... ...
# Restore the objects saved in "test.Rdata" into the current workspace.
load("test.Rdata")
# Print the object at top level to inspect it.
# NOTE(review): char_3grams is presumably one of the objects restored by the
# load() call above -- confirm.
char_3grams
# Run stylo on that object, supplied through the `parsed.corpus` argument.
stylo(parsed.corpus = char_3grams)
--
You received this message because you are subscribed to the Google Groups "computationalstylistics" group.
To unsubscribe from this group and stop receiving emails from it, send an email to computationalstylistics+unsub...@googlegroups.com.