# (Line-number gutter "1 ... 31" and a table delimiter left over from the web page this listing was copied from.)
import nltk
import PyQt4
from PyQt4 import QtGui, QtCore
from PyQt4.QtGui import*
# Build a {file name: list of words} index for a fixed set of text documents.
#
# NOTE(review): the original indentation was lost in this listing. The loop
# structure below (debug prints inside the per-file loop, final lookup after
# it) is the most plausible reconstruction -- confirm against the real script.

# Input paths as QString objects. The "------" runs look like redacted
# segments of the original paths and are kept exactly as they were.
# The first path previously contained the invalid escape "\D"; it is now
# written "\\D", which yields the very same string value.
listfile = [
    PyQt4.QtCore.QString(u'C:\\Users------\\Desktop\\doc\\doc1.txt'),
    PyQt4.QtCore.QString(u'C:\\Users-------Desktop\\doc\\doc2.txt'),
    PyQt4.QtCore.QString(u'C:\\Users\\------Desktop\\doc\\doc3.txt'),
]

# Punctuation characters that are treated as word separators.
punc = ('!', '.', ':', ',')

# Maps the bare file name (e.g. 'doc2.txt') to the list of words in that file.
dictfile = {}

# Working copy of the input paths (same contents, independent list object).
listFile = list(listfile)

# Word list of the most recently processed file.
listmot = []

for qpath in listFile:
    # The built-in open() and the str/unicode methods need a native string,
    # not a QString, so convert once up front.
    path = unicode(qpath)

    # The context manager guarantees the handle is closed, even on error.
    with open(path, 'r') as f:
        t = f.read().lower()

    # Turn every punctuation mark into a space so it separates words.
    for punct in punc:
        t = t.replace(punct, " ")

    # split() without an argument splits on any run of whitespace (spaces,
    # tabs, newlines) and never yields empty strings, unlike split(" ").
    listmot = t.split()

    # Key the word list by the last component of the Windows-style path.
    dictfile[str(path.split('\\')[-1])] = listmot

    # Debug output; formatted so it prints the same text under the Python 2
    # print statement as the original "print label, value" form did.
    print('%s %s' % ('t ************ ', t))
    print('%s %s' % ('listmot *************', listmot))
    print('%s %s' % ('dictfile************** ', dictfile))

print(dictfile['doc2.txt'])
# "Partager" -- share-link text left over from the source web page, not part of the script.