X-Git-Url: http://iramuteq.org/git?p=iramuteq;a=blobdiff_plain;f=ProfList.py;h=1bc2c609b8a4ca4a69336ecd2b7e61bc617b9d2e;hp=213ae68258897c2cfb72cfe9b94bea4d01b91f89;hb=bd8d0a889d1d393e64a6d768dc14e9c639a0df8c;hpb=adc24190c47d42d5fa02f074516fc331950d8c5c diff --git a/ProfList.py b/ProfList.py index 213ae68..1bc2c60 100644 --- a/ProfList.py +++ b/ProfList.py @@ -24,13 +24,14 @@ from dialog import PrefExport, PrefUCECarac, SearchDial, message from tableau import Tableau from search_tools import SearchFrame import webbrowser -import cStringIO +#import cStringIO import tempfile import codecs -from functions import exec_rcode, MessageImage, progressbar, treat_var_mod +from functions import exec_rcode, MessageImage, progressbar, treat_var_mod, doconcorde from PrintRScript import barplot from textclassechd import ClasseCHD from shutil import copyfile +from operator import itemgetter #--------------------------------------------------------------------------- class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.ColumnSorterMixin): @@ -100,7 +101,7 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col self.InsertColumn(0, "num", wx.LIST_FORMAT_RIGHT) - self.InsertColumn(1, "eff. uce", wx.LIST_FORMAT_RIGHT) + self.InsertColumn(1, "eff. s.t.", wx.LIST_FORMAT_RIGHT) self.InsertColumn(2, "eff. total", wx.LIST_FORMAT_RIGHT) self.InsertColumn(3, "pourcentage", wx.LIST_FORMAT_RIGHT) self.InsertColumn(4, "chi2", wx.LIST_FORMAT_RIGHT) @@ -133,7 +134,7 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col #events #self.Bind(wx.EVT_LIST_ITEM_SELECTED, self.OnItemSelected) - #self.Bind(wx.EVT_LIST_ITEM_ACTIVATED, self.OnItemActivated) + self.Bind(wx.EVT_LIST_ITEM_ACTIVATED, self.OnPopupTwo, self) #self.Bind(wx.EVT_LIST_ITEM_DESELECTED, self.OnItemDeselected) self.Bind(wx.EVT_LIST_COL_CLICK, self.OnColClick) @@ -146,6 +147,7 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col #for searching search_id = wx.NewId() searchall_id = wx.NewId() + concord_id = wx.NewId() self.parent.Bind(wx.EVT_MENU, self.onsearch, id = search_id) self.parent.Bind(wx.EVT_MENU, self.onsearchall, id = searchall_id) self.accel_tbl = wx.AcceleratorTable([(wx.ACCEL_CTRL, ord('F'), search_id), @@ -236,16 +238,16 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col def onsearch(self, evt) : self.dial = SearchDial(self, self, 6, True) self.dial.CenterOnParent() - self.dial.ShowModal() - self.dial.Destroy() + self.dial.Show() + #self.dial.Destroy() def onsearchall(self, evt) : if 'FrameSearch' not in dir(self.Source) : self.Source.FrameSearch = SearchFrame(self.parent, -1, u"Rechercher...", self.Source.corpus) self.dial = SearchDial(self, self.Source.FrameSearch.liste, 1, False) self.dial.CenterOnParent() - self.dial.ShowModal() - self.dial.Destroy() + self.dial.Show() + #self.dial.Destroy() def OnRightClick(self, event): @@ -270,7 +272,10 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col self.idwordgraph = wx.NewId() self.popup_proxe = wx.NewId() self.idlexdendro = wx.NewId() + self.idcloud = wx.NewId() self.idexport = wx.NewId() + self.idexporttropes = wx.NewId() + self.idexportowledge = wx.NewId() # self.export_classes = wx.NewId() self.Bind(wx.EVT_MENU, self.OnPopupOne, id=self.popupID1) @@ -291,7 +296,10 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col self.Bind(wx.EVT_MENU, self.onwordgraph, id = self.idwordgraph) self.Bind(wx.EVT_MENU, self.onproxe, id = self.popup_proxe) self.Bind(wx.EVT_MENU, self.onlexdendro, id = self.idlexdendro) + self.Bind(wx.EVT_MENU, self.oncloud, id = self.idcloud) self.Bind(wx.EVT_MENU, self.onexport, id = self.idexport) + self.Bind(wx.EVT_MENU, self.onexporttropes, id = self.idexporttropes) + self.Bind(wx.EVT_MENU, self.onexportowledge, id = self.idexportowledge) # self.Bind(wx.EVT_MENU, self.on_export_classes, id = self.export_classes) # self.Bind(wx.EVT_MENU, self.OnPopupThree, id=self.popupID3) @@ -307,9 +315,9 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col #menu.Append(self.popupID10, u"Spécificités") menu_conc = wx.Menu() - menu_conc.Append(self.popupID2, u"dans les uce de la classe") - menu_conc.Append(self.popupID3, u"dans les uce classées") - menu_conc.Append(self.popupID4, u"dans toutes les uce") + menu_conc.Append(self.popupID2, u"dans les segments de texte de la classe") + menu_conc.Append(self.popupID3, u"dans les segments de texte classés") + menu_conc.Append(self.popupID4, u"dans tous les segments de texte") menu.AppendMenu(-1, u"Concordancier", menu_conc) menu_cnrtl = wx.Menu() menu_cnrtl.Append(self.popupID5, u"Définition") @@ -322,8 +330,11 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col menu.AppendSeparator() menu.Append(self.popupIDgraph, u"Graphe de la classe") menu.Append(self.idseg, u"Segments répétés") - menu.Append(self.iducecarac, u"UCE caractéristiques") - menu.Append(self.idexport, 'Partitionner...') + menu.Append(self.iducecarac, u"Segments de texte caractéristiques") + menu.Append(self.idcloud, u"Nuage de la classe") + menu.Append(self.idexport, u'Exporter...') + menu.Append(self.idexporttropes, 'Exporter pour Tropes') + menu.Append(self.idexportowledge, 'Exporter pour Owledge') #menu.Append(self.popupID2, u"Concordancier") # menu.Append(self.popupID3, "recharger") @@ -346,10 +357,56 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col self.PopupMenu(menu) menu.Destroy() + def oncloud(self, evt) : + if 'corpus' in dir(self.Source): + corpus = self.Source.corpus + prof = [[self.la[i], self.lchi[i], self.lfreq[i]] for i, val in enumerate(self.la)] + parametres = self.Source.parametres + parametres['clusterprof'] = prof + parametres['type'] = 'clustercloud' + parametres['prof'] = self.Source.pathout['actprof_classe_%i.csv' % self.cl] + del parametres['uuid'] + #if not os.path.exists(self.Source.pathout['actprof_classe_%i.csv' % self.lc]) : + # with open(self.Source.pathout['actprof_classe_%i.csv' % self.lc], 'w') as f : + # f.write('\n'.join(prof).encode(self.parent.syscoding)) + self.parent.OnClusterCloud(self.Source.corpus, parametres = parametres) + def onexport(self, evt) : if 'corpus' in dir(self.Source): corpus = self.Source.corpus - ClasseCHD(self.parent, corpus, self.cl) + if self.Source.parametres['classif_mode'] != 2 : + uci = False + else : + uci = True + corpus.export_classe(self.Source.pathout['classe_%i_export.txt' % self.cl], self.cl, uci = uci) + dial = wx.MessageDialog(self, self.Source.pathout['classe_%i_export.txt' % self.cl], u"Export", wx.OK|wx.ICON_INFORMATION) + dial.ShowModal() + dial.Destroy() + #if 'corpus' in dir(self.Source): + # corpus = self.Source.corpus + #ClasseCHD(self.parent, corpus, self.cl) + + def onexporttropes(self, evt) : + if 'corpus' in dir(self.Source): + corpus = self.Source.corpus + if self.Source.parametres['classif_mode'] != 2 : + uci = False + else : + uci = True + fileout = self.Source.pathout['export_tropes_classe_%i.txt' % self.cl] + corpus.export_tropes(fileout, self.cl, uci = uci) + + def onexportowledge(self, evt): + if 'corpus' in dir(self.Source): + corpus = self.Source.corpus + if self.Source.parametres['classif_mode'] != 2 : + uci = False + else : + uci = True + repout = self.Source.pathout['export_owledge_classe_%i' % self.cl] + if not os.path.exists(repout) : + os.mkdir(repout) + corpus.export_owledge(repout, self.cl, uci = uci) def getselectedwords(self) : words = [self.getColumnText(self.GetFirstSelected(), 6)] @@ -409,6 +466,10 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col tableau = self.Source.tableau tab = tableau.make_table_from_classe(self.cl, self.la) pathout = ConstructPathOut(self.Source.pathout.dirout, 'simi_classe_%i' %self.cl) + if self.tmpchi is None : + self.tmpchi = os.path.join(pathout,'chi.csv') + with open(self.tmpchi, 'w') as f: + f.write('\n'.join([str(val) for val in self.lchi])) self.filename = os.path.join(pathout,'mat01.csv') tableau.printtable(self.filename, tab) del tab @@ -444,15 +505,9 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col 'film': False, 'com' : 0, 'communities' : 0, - 'halo' : 0 + 'halo' : 0, + 'tmpchi': self.tmpchi } -# self.tableau.actives = {} -# self.tableau.lchi = self.lchi -# self.tableau.chi = {} -# for i, val in enumerate(self.la) : -# self.tableau.actives[val] = [self.lfreq[i]] -# self.tableau.chi[val] = [self.lchi[i]] - act = {} tableau.chi = {} tableau.lchi = self.lchi @@ -465,7 +520,7 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col def onwordgraph(self, evt): word = self.getColumnText(self.GetFirstSelected(), 6) if self.tmpchi is None : - self.tmpchi = tempfile.mktemp(dir=self.Source.parent.TEMPDIR) + self.tmpchi = os.path.join(self.Source.parametres['pathout'],'chi_%i.csv' % self.cl) with open(self.tmpchi, 'w') as f: f.write('\n'.join([str(val) for val in self.lchi])) index = self.la.index(word) @@ -481,7 +536,7 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col def on_graph(self, evt): if self.tmpchi is None : - self.tmpchi = tempfile.mktemp(dir=self.Source.parent.TEMPDIR) + self.tmpchi = os.path.join(self.Source.parametres['pathout'],'chi_%i.csv' % self.cl) with open(self.tmpchi, 'w') as f: f.write('\n'.join([str(val) for val in self.lchi])) parametres = {'type' : 'clustersimitxt', @@ -490,68 +545,19 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col 'tmpchi' : self.tmpchi} self.parent.SimiFromCluster(self.parent, self.Source.corpus, self.la, self.lfreq, self.lchi, self.cl - 1, parametres = parametres, dlg = progressbar(self, 4)) - #dlg = progressbar(self, 2) - #corpus = self.Source.corpus - #uces = corpus.lc[self.cl-1] - #dlg.Update(1, u'Tableau...') - ##tab = corpus.make_table_with_classe(uces, self.la) - #pathout = ConstructPathOut(self.Source.pathout.dirout+'/', 'simi_classe_%i' %self.cl) - #self.filename = os.path.join(pathout,'mat01.csv') - #dlg.Update(2, u'Ecriture...') - ##corpus.write_tab(tab, self.filename) - ##del tab - #corpus.make_and_write_sparse_matrix_from_classe(self.la, uces, self.filename) - #dlg.Destroy() - #paramsimi = {'coeff' : 0, - # 'layout' : 2, - # 'type' : 1, - # 'arbremax' : 1, - # 'coeff_tv' : 1, - # 'coeff_tv_nb' : 0, - # 'tvprop' : 0, - # 'tvmin' : 5, - # 'tvmax' : 30, - # 'coeff_te' : 1, - # 'coeff_temin' : 1, - # 'coeff_temax' : 10, - # 'label_v': 1, - # 'label_e': 0, - # 'vcex' : 0, - # 'vcexmin' : 10, - # 'vcexmax' : 25, - # 'cex' : 10, - # 'cexfromchi' : True, - # 'sfromchi': False, - # 'seuil_ok' : 0, - # 'seuil' : 1, - # 'cols' : (255,0,0), - # 'cola' : (200,200,200), - # 'width' : 1000, - # 'height' : 1000, - # 'first' : True, - # 'keep_coord' : True, - # 'alpha' : 20, - # 'film': False, - # } - #self.tableau = Tableau(self.parent, '') - #self.tableau.listactives = self.la - #self.tableau.actives = {} - #self.tableau.lchi = self.lchi - #self.tableau.chi = {} - #self.tableau.parametre['fromprof'] = True - #for i, val in enumerate(self.la) : - # self.tableau.actives[val] = [self.lfreq[i]] - # self.tableau.chi[val] = [self.lchi[i]] - #DoSimi(self, param = paramsimi, fromprof = ffr(self.filename), pathout = pathout) def on_segments(self,evt) : dlg = progressbar(self, 2) corpus = self.Source.corpus uces = corpus.lc[self.cl-1] + if self.Source.parametres['classif_mode'] != 2 : + uci = False + else : + uci = True l = [] dlg.Update(1, u'Segments...') for i in range(2,10) : - li = corpus.find_segments_in_classe(uces, i, 1000) + li = corpus.find_segments_in_classe(uces, i, 1000, uci = uci) if li == [] : break else : @@ -576,7 +582,11 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col dlg = progressbar(self,maxi = 4) corpus = self.Source.corpus uces = corpus.lc[self.cl-1] - tab = corpus.make_table_with_classe(uces, self.la) + if self.Source.parametres['classif_mode'] != 2 : + uci = False + else : + uci = True + tab = corpus.make_table_with_classe(uces, self.la, uci = uci) tab.pop(0) dlg.Update(2, u'score...') if atype == 0 : @@ -589,24 +599,10 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col ntab2 = ntab2[:limite] nuces = [val[1] for val in ntab2] dlg.Update(3, u'concordancier...') - #ucestxt = [corpus.ucis_paras_uces[val[1][0]][val[1][1]][val[1][2]] for val in ntab2] - ucestxt1 = [row for row in corpus.getconcorde(nuces)] - ucestxt = [] - ucis_txt = [] - for uce in ucestxt1 : - ucetxt = ' '+uce[1]+' ' - ucis_txt.append(' '.join(corpus.ucis[corpus.getucefromid(uce[0]).uci].etoiles) + '
') - for lem in self.la : - listmot = corpus.getlems()[lem].formes - for id in listmot : - forme = corpus.getforme(id).forme - ucetxt = ucetxt.replace(' '+forme+' ', ' ' + forme + ' ') - ucestxt.append(ucetxt) - #ucestxt = [corpus.make_concord(self.la, ' '.join(uce), 'red') for uce in ucestxt] + ucis_txt, ucestxt = doconcorde(corpus, nuces, self.la, uci = uci) dlg.Update(4, u'texte...') - #ucis_txt = [' '.join(corpus.ucis[val[1][0]][0]) for val in ntab2] - win = message(self, u"UCE caractéristiques - Classe %i" % self.cl, (750, 600)) - win.html = '\n' + '

'.join(['
'.join([ucis_txt[i], 'score : ' + str(ntab2[i][0]), ucestxt[i]]) for i in range(0,len(ucestxt))]) + '\n' + win = message(self, u"Segments de texte caractéristiques - Classe %i" % self.cl, (750, 600)) + win.html = '\n' + '
'.join(['
'.join([ucis_txt[i], '
score : %.2f
' % ntab2[i][0], ucestxt[i]]) for i in range(0,len(ucestxt))]) + '\n' win.HtmlPage.SetPage(win.html) dlg.Destroy() win.Show(True) @@ -629,6 +625,12 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col nbcl = len(title) nbwords = len(words) txt = barplot(tableout, words, title, self.Source.parent.RscriptsPath['Rgraph'], tmpgraph) + #print 'ATTENTION TEST R' + #txt = """ + #sink('/Users/pierre/Desktop/qdfqsdfqsdfqsdf.txt') + #Sys.getlocale() + #sink() + #""" tmpscript = tempfile.mktemp(dir=self.Source.parent.TEMPDIR) file = open(tmpscript,'w') file.write(txt) @@ -689,7 +691,6 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col win.HtmlPage.SetPage(txt) win.Show(True) - def make_concord(self, uces, title, color = 'red') : corpus = self.Source.corpus ListWord = [self.getColumnText(self.GetFirstSelected(), 6)] @@ -697,26 +698,19 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col while self.GetNextSelected(last) != -1: last = self.GetNextSelected(last) ListWord.append(self.getColumnText(last, 6)) - listmot = [forme for item in ListWord for forme in corpus.getlems()[item].formes] - win = message(self, title, size=(750, 600)) - toshow = ['\n

Concordancier

\n'] - toshow.append('

' % color + ' '.join(ListWord) + '


') - duce = {} ucef = [] - for word in ListWord : - ucef += list(set(corpus.getlemuces(word)).intersection(uces)) - ucef = list(set(ucef)) - ucef.sort() - res = corpus.getconcorde(ucef) - txt = '
'.join(toshow) +'

' - for uce in res : - ucetxt = ' '+uce[1]+' ' - txt += ' '.join(corpus.ucis[corpus.getucefromid(uce[0]).uci].etoiles) + '
' - for forme in listmot: - forme = corpus.getforme(forme).forme - ucetxt = ucetxt.replace(' '+forme+' ', ' ' + forme + ' ') - txt += ucetxt + '

' - win.HtmlPage.SetPage(txt) + if self.Source.parametres['classif_mode'] != 2 : + for word in ListWord : + uci = False + ucef += list(set(corpus.getlemuces(word)).intersection(uces)) + else : + for word in ListWord : + ucef += list(set(corpus.getlemucis(word)).intersection(uces)) + uci = True + ucis_txt, ucestxt = doconcorde(corpus, ucef, ListWord, uci = uci) + win = message(self, title, size=(750, 600)) + win.html = ('\n

%s

' % ' '.join(ListWord)) + '
'.join(['
'.join([ucis_txt[i], ucestxt[i]]) for i in range(0,len(ucestxt))]) + '\n' + win.HtmlPage.SetPage(win.html) return win def OnPopupTwo(self, event): @@ -777,12 +771,42 @@ class ProfListctrlPanel(wx.ListCtrl, listmix.ListCtrlAutoWidthMixin, listmix.Col rep = [] #FIXME : donner aussi eff reel a la place de nb uce for forme in lems[word].formes : - ucef = list(set(corpus.getworduces(forme)).intersection(uces)) + if self.Source.parametres['classif_mode'] != 2 : + ucef = list(set(corpus.getworduces(forme)).intersection(uces)) + else : + ucef = list(set(corpus.getworducis(forme)).intersection(uces)) #ucef = [uce for uce in corpus.formes[forme][1] if uce in uces] if ucef != [] : nb = len(ucef) rep.append([corpus.getforme(forme).forme, nb]) + rep.sort(key = itemgetter(1), reverse = True) win = message(self, u"Formes associées", wx.Size(300, 200)) win.html = '\n' + '
'.join([' : '.join([str(val) for val in forme]) for forme in rep]) + '\n' win.HtmlPage.SetPage(win.html) win.Show(True) + + +class wliste(wx.Frame): + def __init__(self, parent, id, title, d, fline, size=(600, 500)): + wx.Frame.__init__(self, parent, id) + self.liste = ListForSpec(self, parent, d, fline, menu = False) + self.button_1 = wx.Button(self, -1, "Fermer") + self.Bind(wx.EVT_BUTTON, self.OnCloseMe, self.button_1) + self.Bind(wx.EVT_CLOSE, self.OnCloseWindow) + self.__do_layout() + + def __do_layout(self): + sizer_1 = wx.BoxSizer(wx.VERTICAL) + sizer_2 = wx.BoxSizer(wx.VERTICAL) + sizer_2.Add(self.liste, 1, wx.EXPAND | wx.ADJUST_MINSIZE, 0) + sizer_2.Add(self.button_1, 0, wx.ALIGN_CENTER_HORIZONTAL | wx.ADJUST_MINSIZE, 0) + sizer_1.Add(sizer_2, 1, wx.EXPAND, 0) + self.SetAutoLayout(True) + self.SetSizer(sizer_1) + self.Layout() + + def OnCloseMe(self, event): + self.Close(True) + + def OnCloseWindow(self, event): + self.Destroy()