projects
/
iramuteq
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
...
[iramuteq]
/
configuration
/
corpus.cfg
diff --git
a/configuration/corpus.cfg
b/configuration/corpus.cfg
index
52491e6
..
06959bc
100644
(file)
--- a/
configuration/corpus.cfg
+++ b/
configuration/corpus.cfg
@@
-1,12
+1,12
@@
[corpus]
corpus_name =
[corpus]
corpus_name =
-filename =
test.txt
+filename =
originalpath =
encoding = utf8
lang = french
douce = 1
ucemethod = 1
originalpath =
encoding = utf8
lang = french
douce = 1
ucemethod = 1
-ucesize =
35
+ucesize =
40
keep_ponct = 0
tolist = 0
etoile = 1
keep_ponct = 0
tolist = 0
etoile = 1
@@
-15,10
+15,12
@@
time =
ucinb =
ucenb =
occurrences =
ucinb =
ucenb =
occurrences =
-keep_caract = ^a-zA-Z0-9àÀâÂäÄáÁåÅãéÉèÈêÊëËìÌîÎïÏíÍòÒôÔöÖõÕøØùÙûÛüÜúÚçÇßœŒ’ñ.:,;!?*'_-
+keep_caract = ^a-zA-Z0-9àÀâÂäÄáÁåÅãéÉèÈêÊëËìÌîÎïÏíÍóÓòÒôÔöÖõÕøØùÙûÛüÜúÚçÇßœŒ’ñÑ.:,;!?'_-
lower = 1
ucimark = 0
expressions = 1
apos = 1
tiret = 1
firstclean = 1
lower = 1
ucimark = 0
expressions = 1
apos = 1
tiret = 1
firstclean = 1
+charact = 1
+lem = 1