This is my code:
import os
import collections
def make_dictionary(train_dir):
emails=[os.path.join(train_dir,f) for f in os.listdir(train_dir)]
all_words=[]
for mail in emails:
with open(mail) as m:
for i,line in enumerate(m):
if i==2: #Body of email is only 3rd line of text file
words=line.split()
all_words+=words
dictionary=collections.Counter(all_words)
# Paste code for non-word removal here(code snippet is given below)
list_to_remove=dictionary.keys()
for item in list_to_remove:
if item.isalpha()==False:
del dictionary[item]
elif len(item)==1:
del dictionary[item]
dictionary=dictionary.mostcommon[3000]
print (dictionary)
make_dictionary('G:\Engineering\Projects\Python\Documents\enron1\ham')
I am receiving the error "RuntimeError: dictionary changed size during iteration" on writing this code. I have only text files in the directory. Any help will be appreciated.