projects
/
iramuteq
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
add R dependencies
[iramuteq]
/
configuration
/
corpus.cfg
diff --git
a/configuration/corpus.cfg
b/configuration/corpus.cfg
index
327f4e8
..
06959bc
100644
(file)
--- a/
configuration/corpus.cfg
+++ b/
configuration/corpus.cfg
@@
-1,12
+1,12
@@
[corpus]
corpus_name =
[corpus]
corpus_name =
-filename = test.txt
+filename =
originalpath =
encoding = utf8
lang = french
douce = 1
originalpath =
encoding = utf8
lang = french
douce = 1
-ucemethod = 0
-ucesize = 35
+ucemethod = 1
+ucesize = 40
keep_ponct = 0
tolist = 0
etoile = 1
keep_ponct = 0
tolist = 0
etoile = 1
@@
-15,10
+15,12
@@
time =
ucinb =
ucenb =
occurrences =
ucinb =
ucenb =
occurrences =
-keep_caract = ^a-zA-Z0-9àÀâÂäÄáÁéÉèÈêÊëËìÌîÎïÏòÒôÔöÖùÙûÛüÜçÇßœŒ’ñ.:,;!?*'_-
+keep_caract = ^a-zA-Z0-9àÀâÂäÄáÁåÅãéÉèÈêÊëËìÌîÎïÏíÍóÓòÒôÔöÖõÕøØùÙûÛüÜúÚçÇßœŒ’ñÑ.:,;!?'_-
lower = 1
ucimark = 0
expressions = 1
apos = 1
tiret = 1
firstclean = 1
lower = 1
ucimark = 0
expressions = 1
apos = 1
tiret = 1
firstclean = 1
+charact = 1
+lem = 1