projects
/
iramuteq
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
mainly translation and more
[iramuteq]
/
configuration
/
corpus.cfg
diff --git
a/configuration/corpus.cfg
b/configuration/corpus.cfg
index
327f4e8
..
06959bc
100644
(file)
--- a/
configuration/corpus.cfg
+++ b/
configuration/corpus.cfg
@@
-1,12
+1,12
@@
[corpus]
corpus_name =
[corpus]
corpus_name =
-filename =
test.txt
+filename =
originalpath =
encoding = utf8
lang = french
douce = 1
originalpath =
encoding = utf8
lang = french
douce = 1
-ucemethod =
0
-ucesize =
35
+ucemethod =
1
+ucesize =
40
keep_ponct = 0
tolist = 0
etoile = 1
keep_ponct = 0
tolist = 0
etoile = 1
@@
-15,10
+15,12
@@
time =
ucinb =
ucenb =
occurrences =
ucinb =
ucenb =
occurrences =
-keep_caract = ^a-zA-Z0-9àÀâÂäÄáÁéÉèÈêÊëËìÌîÎïÏòÒôÔöÖùÙûÛüÜçÇßœŒ’ñ.:,;!?*'_-
+keep_caract = ^a-zA-Z0-9àÀâÂäÄáÁåÅãéÉèÈêÊëËìÌîÎïÏíÍóÓòÒôÔöÖõÕøØùÙûÛüÜúÚçÇßœŒ’ñÑ.:,;!?'_-
lower = 1
ucimark = 0
expressions = 1
apos = 1
tiret = 1
firstclean = 1
lower = 1
ucimark = 0
expressions = 1
apos = 1
tiret = 1
firstclean = 1
+charact = 1
+lem = 1