X-Git-Url: http://iramuteq.org/git?a=blobdiff_plain;ds=inline;f=ProfList.py;h=e882f7ebd126751f3e78f79e7f5d6f280c03b952;hb=a08aea7209aa958dee6b6337525b8036b9215100;hp=7ac42c54a04fa040b677347ba898bc664f632744;hpb=e033f9e84abb3c12d92f1580425877aa58e9af30;p=iramuteq
diff --git a/ProfList.py b/ProfList.py
index 7ac42c5..e882f7e 100644
--- a/ProfList.py
+++ b/ProfList.py
@@ -27,7 +27,7 @@ import webbrowser
#import cStringIO
import tempfile
import codecs
-from functions import exec_rcode, MessageImage, progressbar, treat_var_mod
+from functions import exec_rcode, MessageImage, progressbar, treat_var_mod, doconcorde
from PrintRScript import barplot
from textclassechd import ClasseCHD
from shutil import copyfile
@@ -101,7 +101,7 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
self.InsertColumn(0, "num", wx.LIST_FORMAT_RIGHT)
- self.InsertColumn(1, "eff. uce", wx.LIST_FORMAT_RIGHT)
+ self.InsertColumn(1, "eff. s.t.", wx.LIST_FORMAT_RIGHT)
self.InsertColumn(2, "eff. total", wx.LIST_FORMAT_RIGHT)
self.InsertColumn(3, "pourcentage", wx.LIST_FORMAT_RIGHT)
self.InsertColumn(4, "chi2", wx.LIST_FORMAT_RIGHT)
@@ -134,7 +134,7 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
#events
#self.Bind(wx.EVT_LIST_ITEM_SELECTED, self.OnItemSelected)
- #self.Bind(wx.EVT_LIST_ITEM_ACTIVATED, self.OnItemActivated)
+ self.Bind(wx.EVT_LIST_ITEM_ACTIVATED, self.OnPopupTwo, self)
#self.Bind(wx.EVT_LIST_ITEM_DESELECTED, self.OnItemDeselected)
self.Bind(wx.EVT_LIST_COL_CLICK, self.OnColClick)
@@ -147,6 +147,7 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
#for searching
search_id = wx.NewId()
searchall_id = wx.NewId()
+ concord_id = wx.NewId()
self.parent.Bind(wx.EVT_MENU, self.onsearch, id = search_id)
self.parent.Bind(wx.EVT_MENU, self.onsearchall, id = searchall_id)
self.accel_tbl = wx.AcceleratorTable([(wx.ACCEL_CTRL, ord('F'), search_id),
@@ -271,7 +272,10 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
self.idwordgraph = wx.NewId()
self.popup_proxe = wx.NewId()
self.idlexdendro = wx.NewId()
+ self.idcloud = wx.NewId()
self.idexport = wx.NewId()
+ self.idexporttropes = wx.NewId()
+ self.idexportowledge = wx.NewId()
# self.export_classes = wx.NewId()
self.Bind(wx.EVT_MENU, self.OnPopupOne, id=self.popupID1)
@@ -292,7 +296,10 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
self.Bind(wx.EVT_MENU, self.onwordgraph, id = self.idwordgraph)
self.Bind(wx.EVT_MENU, self.onproxe, id = self.popup_proxe)
self.Bind(wx.EVT_MENU, self.onlexdendro, id = self.idlexdendro)
+ self.Bind(wx.EVT_MENU, self.oncloud, id = self.idcloud)
self.Bind(wx.EVT_MENU, self.onexport, id = self.idexport)
+ self.Bind(wx.EVT_MENU, self.onexporttropes, id = self.idexporttropes)
+ self.Bind(wx.EVT_MENU, self.onexportowledge, id = self.idexportowledge)
# self.Bind(wx.EVT_MENU, self.on_export_classes, id = self.export_classes)
# self.Bind(wx.EVT_MENU, self.OnPopupThree, id=self.popupID3)
@@ -308,9 +315,9 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
#menu.Append(self.popupID10, u"Spécificités")
menu_conc = wx.Menu()
- menu_conc.Append(self.popupID2, u"dans les uce de la classe")
- menu_conc.Append(self.popupID3, u"dans les uce classées")
- menu_conc.Append(self.popupID4, u"dans toutes les uce")
+ menu_conc.Append(self.popupID2, u"dans les segments de texte de la classe")
+ menu_conc.Append(self.popupID3, u"dans les segments de texte classés")
+ menu_conc.Append(self.popupID4, u"dans tous les segments de texte")
menu.AppendMenu(-1, u"Concordancier", menu_conc)
menu_cnrtl = wx.Menu()
menu_cnrtl.Append(self.popupID5, u"Définition")
@@ -323,8 +330,11 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
menu.AppendSeparator()
menu.Append(self.popupIDgraph, u"Graphe de la classe")
menu.Append(self.idseg, u"Segments répétés")
- menu.Append(self.iducecarac, u"UCE caractéristiques")
- menu.Append(self.idexport, 'Exporter...')
+ menu.Append(self.iducecarac, u"Segments de texte caractéristiques")
+ menu.Append(self.idcloud, u"Nuage de la classe")
+ menu.Append(self.idexport, u'Exporter...')
+ menu.Append(self.idexporttropes, 'Exporter pour Tropes')
+ menu.Append(self.idexportowledge, 'Exporter pour Owledge')
#menu.Append(self.popupID2, u"Concordancier")
# menu.Append(self.popupID3, "recharger")
@@ -347,16 +357,56 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
self.PopupMenu(menu)
menu.Destroy()
+ def oncloud(self, evt) :
+ if 'corpus' in dir(self.Source):
+ corpus = self.Source.corpus
+ prof = [[self.la[i], self.lchi[i], self.lfreq[i]] for i, val in enumerate(self.la)]
+ parametres = self.Source.parametres
+ parametres['clusterprof'] = prof
+ parametres['type'] = 'clustercloud'
+ parametres['prof'] = self.Source.pathout['actprof_classe_%i.csv' % self.cl]
+ del parametres['uuid']
+ #if not os.path.exists(self.Source.pathout['actprof_classe_%i.csv' % self.lc]) :
+ # with open(self.Source.pathout['actprof_classe_%i.csv' % self.lc], 'w') as f :
+ # f.write('\n'.join(prof).encode(self.parent.syscoding))
+ self.parent.OnClusterCloud(self.Source.corpus, parametres = parametres)
+
def onexport(self, evt) :
if 'corpus' in dir(self.Source):
corpus = self.Source.corpus
- corpus.export_classe(self.Source.pathout['classe_%i_export.txt' % self.cl], self.cl)
+ if self.Source.parametres['classif_mode'] != 2 :
+ uci = False
+ else :
+ uci = True
+ corpus.export_classe(self.Source.pathout['classe_%i_export.txt' % self.cl], self.cl, uci = uci)
dial = wx.MessageDialog(self, self.Source.pathout['classe_%i_export.txt' % self.cl], u"Export", wx.OK|wx.ICON_INFORMATION)
dial.ShowModal()
dial.Destroy()
#if 'corpus' in dir(self.Source):
# corpus = self.Source.corpus
#ClasseCHD(self.parent, corpus, self.cl)
+
+ def onexporttropes(self, evt) :
+ if 'corpus' in dir(self.Source):
+ corpus = self.Source.corpus
+ if self.Source.parametres['classif_mode'] != 2 :
+ uci = False
+ else :
+ uci = True
+ fileout = self.Source.pathout['export_tropes_classe_%i.txt' % self.cl]
+ corpus.export_tropes(fileout, self.cl, uci = uci)
+
+ def onexportowledge(self, evt):
+ if 'corpus' in dir(self.Source):
+ corpus = self.Source.corpus
+ if self.Source.parametres['classif_mode'] != 2 :
+ uci = False
+ else :
+ uci = True
+ repout = self.Source.pathout['export_owledge_classe_%i' % self.cl]
+ if not os.path.exists(repout) :
+ os.mkdir(repout)
+ corpus.export_owledge(repout, self.cl, uci = uci)
def getselectedwords(self) :
words = [self.getColumnText(self.GetFirstSelected(), 6)]
@@ -416,6 +466,10 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
tableau = self.Source.tableau
tab = tableau.make_table_from_classe(self.cl, self.la)
pathout = ConstructPathOut(self.Source.pathout.dirout, 'simi_classe_%i' %self.cl)
+ if self.tmpchi is None :
+ self.tmpchi = os.path.join(pathout,'chi.csv')
+ with open(self.tmpchi, 'w') as f:
+ f.write('\n'.join([str(val) for val in self.lchi]))
self.filename = os.path.join(pathout,'mat01.csv')
tableau.printtable(self.filename, tab)
del tab
@@ -451,12 +505,13 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
'film': False,
'com' : 0,
'communities' : 0,
- 'halo' : 0
+ 'halo' : 0,
+ 'tmpchi': self.tmpchi
}
act = {}
tableau.chi = {}
tableau.lchi = self.lchi
- tableau.parametre['fromprof'] = True
+ tableau.parametres['fromprof'] = True
for i, val in enumerate(self.la) :
act[val] = [self.lfreq[i]]
tableau.chi[val] = [self.lchi[i]]
@@ -465,7 +520,7 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
def onwordgraph(self, evt):
word = self.getColumnText(self.GetFirstSelected(), 6)
if self.tmpchi is None :
- self.tmpchi = tempfile.mktemp(dir=self.Source.parent.TEMPDIR)
+ self.tmpchi = os.path.join(self.Source.parametres['pathout'],'chi_%i.csv' % self.cl)
with open(self.tmpchi, 'w') as f:
f.write('\n'.join([str(val) for val in self.lchi]))
index = self.la.index(word)
@@ -481,7 +536,7 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
def on_graph(self, evt):
if self.tmpchi is None :
- self.tmpchi = tempfile.mktemp(dir=self.Source.parent.TEMPDIR)
+ self.tmpchi = os.path.join(self.Source.parametres['pathout'],'chi_%i.csv' % self.cl)
with open(self.tmpchi, 'w') as f:
f.write('\n'.join([str(val) for val in self.lchi]))
parametres = {'type' : 'clustersimitxt',
@@ -495,10 +550,14 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
dlg = progressbar(self, 2)
corpus = self.Source.corpus
uces = corpus.lc[self.cl-1]
+ if self.Source.parametres['classif_mode'] != 2 :
+ uci = False
+ else :
+ uci = True
l = []
dlg.Update(1, u'Segments...')
for i in range(2,10) :
- li = corpus.find_segments_in_classe(uces, i, 1000)
+ li = corpus.find_segments_in_classe(uces, i, 1000, uci = uci)
if li == [] :
break
else :
@@ -523,7 +582,11 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
dlg = progressbar(self,maxi = 4)
corpus = self.Source.corpus
uces = corpus.lc[self.cl-1]
- tab = corpus.make_table_with_classe(uces, self.la)
+ if self.Source.parametres['classif_mode'] != 2 :
+ uci = False
+ else :
+ uci = True
+ tab = corpus.make_table_with_classe(uces, self.la, uci = uci)
tab.pop(0)
dlg.Update(2, u'score...')
if atype == 0 :
@@ -536,25 +599,12 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
ntab2 = ntab2[:limite]
nuces = [val[1] for val in ntab2]
dlg.Update(3, u'concordancier...')
- #ucestxt = [corpus.ucis_paras_uces[val[1][0]][val[1][1]][val[1][2]] for val in ntab2]
- ucestxt1 = [row for row in corpus.getconcorde(nuces)]
- ucestxt = []
- ucis_txt = []
- for uce in ucestxt1 :
- ucetxt = ' '+uce[1]+' '
- ucis_txt.append(' '.join(corpus.ucis[corpus.getucefromid(uce[0]).uci].etoiles) + '
')
- for lem in self.la :
- listmot = corpus.getlems()[lem].formes
- for id in listmot :
- forme = corpus.getforme(id).forme
- ucetxt = ucetxt.replace(' '+forme+' ', ' ' + forme + ' ')
- ucestxt.append(ucetxt)
- #ucestxt = [corpus.make_concord(self.la, ' '.join(uce), 'red') for uce in ucestxt]
+ ucis_txt, ucestxt = doconcorde(corpus, nuces, self.la, uci = uci)
+ items = dict([[i, '
'.join([ucis_txt[i], '
' % ntab2[i][0], ucestxt[i]])] for i in range(0,len(ucestxt))])
dlg.Update(4, u'texte...')
- #ucis_txt = [' '.join(corpus.ucis[val[1][0]][0]) for val in ntab2]
- win = message(self, u"UCE caractéristiques - Classe %i" % self.cl, (750, 600))
- win.html = '\n' + '
'.join(['
'.join([ucis_txt[i], 'score : ' + str(ntab2[i][0]), ucestxt[i]]) for i in range(0,len(ucestxt))]) + '\n'
- win.HtmlPage.SetPage(win.html)
+ win = message(self, items, u"Segments de texte caractéristiques - Classe %i" % self.cl, (750, 600))
+ #win.html = '\n' + '
'.join(['
'.join([ucis_txt[i], '' % ntab2[i][0], ucestxt[i]]) for i in range(0,len(ucestxt))]) + '\n'
+ #win.HtmlPage.SetPage(win.html)
dlg.Destroy()
win.Show(True)
@@ -642,7 +692,6 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
win.HtmlPage.SetPage(txt)
win.Show(True)
-
def make_concord(self, uces, title, color = 'red') :
corpus = self.Source.corpus
ListWord = [self.getColumnText(self.GetFirstSelected(), 6)]
@@ -650,33 +699,29 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
while self.GetNextSelected(last) != -1:
last = self.GetNextSelected(last)
ListWord.append(self.getColumnText(last, 6))
- listmot = [forme for item in ListWord for forme in corpus.getlems()[item].formes]
- win = message(self, title, size=(750, 600))
- toshow = ['\nConcordancier
\n']
- toshow.append('' % color + ' '.join(ListWord) + '
')
- duce = {}
ucef = []
- for word in ListWord :
- ucef += list(set(corpus.getlemuces(word)).intersection(uces))
- ucef = list(set(ucef))
- ucef.sort()
- res = corpus.getconcorde(ucef)
- txt = '
'.join(toshow) +'
'
- for uce in res :
- ucetxt = ' '+uce[1]+' '
- txt += ' '.join(corpus.ucis[corpus.getucefromid(uce[0]).uci].etoiles) + '
'
- for forme in listmot:
- forme = corpus.getforme(forme).forme
- ucetxt = ucetxt.replace(' '+forme+' ', ' ' + forme + ' ')
- txt += ucetxt + '
'
- win.HtmlPage.SetPage(txt)
+ if self.Source.parametres['classif_mode'] != 2 :
+ for word in ListWord :
+ uci = False
+ ucef += list(set(corpus.getlemuces(word)).intersection(uces))
+ else :
+ for word in ListWord :
+ ucef += list(set(corpus.getlemucis(word)).intersection(uces))
+ uci = True
+ ucis_txt, ucestxt = doconcorde(corpus, ucef, ListWord, uci = uci)
+ items = dict([[i, '
'.join([ucis_txt[i], ucestxt[i]])] for i in range(0,len(ucestxt))])
+ win = message(self, items, title, (800, 500))
+ #win = message(self, title, size=(750, 600))
+ #win.html = ('\n%s
' % ' '.join(ListWord)) + '
'.join(['
'.join([ucis_txt[i], ucestxt[i]]) for i in range(0,len(ucestxt))]) + '\n'
+ #win.HtmlPage.SetPage(win.html)
return win
def OnPopupTwo(self, event):
- corpus = self.Source.corpus
- uces = corpus.lc[self.cl-1]
- win = self.make_concord(uces, "Concordancier - Classe %i" % self.cl)
- win.Show(True)
+ if 'corpus' in dir(self.Source) :
+ corpus = self.Source.corpus
+ uces = corpus.lc[self.cl-1]
+ win = self.make_concord(uces, "Concordancier - Classe %i" % self.cl)
+ win.Show(True)
def OnPopupThree(self, event):
corpus = self.Source.corpus
@@ -730,15 +775,20 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col
rep = []
#FIXME : donner aussi eff reel a la place de nb uce
for forme in lems[word].formes :
- ucef = list(set(corpus.getworduces(forme)).intersection(uces))
+ if self.Source.parametres['classif_mode'] != 2 :
+ ucef = list(set(corpus.getworduces(forme)).intersection(uces))
+ else :
+ ucef = list(set(corpus.getworducis(forme)).intersection(uces))
#ucef = [uce for uce in corpus.formes[forme][1] if uce in uces]
if ucef != [] :
nb = len(ucef)
rep.append([corpus.getforme(forme).forme, nb])
rep.sort(key = itemgetter(1), reverse = True)
- win = message(self, u"Formes associées", wx.Size(300, 200))
- win.html = '\n' + '
'.join([' : '.join([str(val) for val in forme]) for forme in rep]) + '\n'
- win.HtmlPage.SetPage(win.html)
+ #win = message(self, u"Formes associées", wx.Size(300, 200))
+ items = dict([[i, '\t:\t'.join([str(val) for val in forme])] for i, forme in enumerate(rep)])
+ win = message(self, items, u"Formes associées", (300, 200))
+ #win.html = '\n' + '
'.join([' : '.join([str(val) for val in forme]) for forme in rep]) + '\n'
+ #win.HtmlPage.SetPage(win.html)
win.Show(True)