projects
/
iramuteq
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
...
[iramuteq]
/
configuration
/
corpus.cfg
diff --git
a/configuration/corpus.cfg
b/configuration/corpus.cfg
index
327f4e8
..
190e613
100644
(file)
--- a/
configuration/corpus.cfg
+++ b/
configuration/corpus.cfg
@@
-1,12
+1,12
@@
[corpus]
corpus_name =
[corpus]
corpus_name =
-filename =
test.txt
+filename =
originalpath =
encoding = utf8
lang = french
douce = 1
originalpath =
encoding = utf8
lang = french
douce = 1
-ucemethod =
0
-ucesize =
35
+ucemethod =
1
+ucesize =
40
keep_ponct = 0
tolist = 0
etoile = 1
keep_ponct = 0
tolist = 0
etoile = 1
@@
-15,10
+15,12
@@
time =
ucinb =
ucenb =
occurrences =
ucinb =
ucenb =
occurrences =
-keep_caract = ^a-zA-Z0-9àÀâÂäÄáÁéÉèÈêÊëËìÌîÎïÏòÒôÔöÖùÙûÛüÜçÇßœŒ’ñ.:,;!?*'_-
+keep_caract = ^a-zA-Z0-9àÀâÂäÄáÁåÅãéÉèÈêÊëËìÌîÎïÏíÍòÒôÔöÖõÕøØùÙûÛüÜúÚçÇßœŒ’ñ.:,;!?*'_-
lower = 1
ucimark = 0
expressions = 1
apos = 1
tiret = 1
firstclean = 1
lower = 1
ucimark = 0
expressions = 1
apos = 1
tiret = 1
firstclean = 1
+charact = 1
+lem = 1