projects
/
iramuteq
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
keyframe
[iramuteq]
/
configuration
/
corpus.cfg
diff --git
a/configuration/corpus.cfg
b/configuration/corpus.cfg
index
327f4e8
..
06959bc
100644
(file)
--- a/configuration/corpus.cfg
+++ b/configuration/corpus.cfg
@@ -1,12 +1,12 @@
[corpus]
corpus_name =
[corpus]
corpus_name =
-filename = test.txt
+filename =
originalpath =
encoding = utf8
lang = french
douce = 1
originalpath =
encoding = utf8
lang = french
douce = 1
-ucemethod = 0
-ucesize = 35
+ucemethod = 1
+ucesize = 40
keep_ponct = 0
tolist = 0
etoile = 1
keep_ponct = 0
tolist = 0
etoile = 1
@@ -15,10 +15,12 @@
time =
ucinb =
ucenb =
occurrences =
ucinb =
ucenb =
occurrences =
-keep_caract = ^a-zA-Z0-9àÀâÂäÄáÁéÉèÈêÊëËìÌîÎïÏòÒôÔöÖùÙûÛüÜçÇßœŒ’ñ.:,;!?*'_-
+keep_caract = ^a-zA-Z0-9àÀâÂäÄáÁåÅãéÉèÈêÊëËìÌîÎïÏíÍóÓòÒôÔöÖõÕøØùÙûÛüÜúÚçÇßœŒ’ñÑ.:,;!?'_-
lower = 1
ucimark = 0
expressions = 1
apos = 1
tiret = 1
firstclean = 1
lower = 1
ucimark = 0
expressions = 1
apos = 1
tiret = 1
firstclean = 1
+charact = 1
+lem = 1