# Tutoriel koRpus/test script
# Aller à la navigation
# Aller à la recherche
library("koRpus")
# Example setup -- adapt every path below to your own machine!
# Linux variant of the sample file path, kept for reference:
# fichier_exemple <- "/home/schneide/schneide/methodo/iramuteq/w_txt/Alice.txt"

# Move into the project directory so that the relative path below resolves,
# then display the working directory that is now in effect.
setwd("c:/dks/methodo")
getwd()

# Sample text file, expressed relative to the working directory set above.
fichier_exemple <- "./iramuteq/w_txt/Alice.txt"
# Plain tokenization with koRpus' built-in tokenizer (no external tagger).
# The `detect` vector switches on the `parag` and `hline` flags.
# NOTE(review): the language here is "en", whereas the treetag() call on the
# same file uses "fr" -- confirm which one matches the text.
tagged.text.obj <- tokenize(
  fichier_exemple,
  lang = "en",
  detect = c(parag = TRUE, hline = TRUE)
)

# Inspect the tokens stored in the resulting object.
taggedText(tagged.text.obj)
# Tagging with TreeTagger, configured by hand: the installation directory and
# the preset are handed over through TT.options (Windows install path here).
tagged.text.objS4 <- treetag(
  fichier_exemple,
  treetagger = "manual",
  lang = "fr",
  TT.options = list(path = "C:/soft/TreeTagger", preset = "fr-utf8")
)

# Disabled alternative that points at a Linux TreeTagger installation.
# Enabling it would create the object tagged.text2.objS4.
# tagged.text2.objS4 <- treetag(
#   fichier_exemple,
#   treetagger = "manual",
#   lang = "fr",
#   TT.options = list(path = "/home/schneide/tree-tagger/", preset = "fr-utf8")
# )
# Single readability measure (ARI) for the TreeTagger-annotated text.
ARI(tagged.text.objS4)

# Same text, this time requesting a long list of readability indices in one
# call. No hyphenation object is supplied (hyphen = NULL).
readability(
  tagged.text.objS4,
  hyphen = NULL,
  index = c(
    "ARI", "Bormuth", "Coleman", "Coleman.Liau", "Dale.Chall",
    "Danielson.Bryan", "Dickes.Steiwer", "DRP", "ELF",
    "Farr.Jenkins.Paterson", "Flesch", "Flesch.Kincaid", "FOG", "FORCAST",
    "Fucks", "Harris.Jacobson", "Linsear.Write", "LIX",
    "nWS", "RIX", "SMOG", "Spache", "Strain", "Traenkle.Bailer", "TRI",
    "Wheeler.Smith"
  )
)
# Store the TreeTagger command and the language in the koRpus environment, so
# that the ARI() calls below can pick them up through tagger = "kRp.env".
# NOTE(review): these are Linux paths, unlike the Windows paths used earlier
# in this script -- adapt them to the machine at hand.
# NOTE(review): "fr-utf8" looks like a TreeTagger preset name rather than a
# language code such as "fr" -- confirm against the installed koRpus version.
set.kRp.env(
  TT.cmd = "/home/schneide/tree-tagger/cmd/tree-tagger-french",
  lang = "fr-utf8"
)

# ARI computed directly from text files, tagged on the fly with the settings
# stored in the koRpus environment.
ARI(
  "/mnt/schneide/methodo/iramuteq/w_txt/Alice.txt",
  tagger = "kRp.env"
)
ARI(
  "/mnt/schneide/methodo/iramuteq/w_txt/Activate.txt",
  tagger = "kRp.env"
)
ARI(
  "/mnt/schneide/methodo/iramuteq/w_txt/Mon-entretien-d-embauche.txt",
  tagger = "kRp.env"
)
# Lexical diversity measures.
#
# tagged.text2.objS4 is only created by the alternative treetag() call, which
# is commented out in this script. Referencing it unconditionally stops the
# script with "object not found", so every use of it is guarded: the calls run
# exactly as before when the object exists and are skipped otherwise.
has_second_tagging <- exists("tagged.text2.objS4")

# MTLD for the tagged text (and for the alternative tagging, if available).
MTLD(tagged.text.objS4)
if (has_second_tagging) {
  MTLD(tagged.text2.objS4)
}

# NOTE(review): MTLD() is given a file path here instead of a tagged object --
# confirm that the installed koRpus version accepts this.
MTLD("/mnt/schneide/methodo/iramuteq/w_txt/Mon-entretien-d-embauche.txt")

# All lexical diversity measures at once, then Guiraud's R on its own.
lex.div(tagged.text.objS4)
R.ld(tagged.text.objS4)
if (has_second_tagging) {
  R.ld(tagged.text2.objS4)
}

# Plot of the alternative tagging, only when that object was created.
if (has_second_tagging) {
  plot(tagged.text2.objS4)
}