python 统计文章单词个数 -2
-
xychong123
2017-03-16 13:56:46
-
IT综合
-
原创
-
"""Count how often each word occurs in a text file and print the totals.

Words are compared case-insensitively.  The punctuation marks ``! ? ; . ,``
and any whitespace are treated as word separators.
"""
import collections
import re
import sys

# Default input file, kept from the original script.  A raw string is used so
# the backslash is a literal path separator rather than the start of an
# (invalid) escape sequence.
DEFAULT_PATH = r'c:\invalid.txt'

# One or more separator characters: the punctuation the script strips
# (! ? ; . ,) or any whitespace (spaces, tabs, newlines).
_WORD_SEPARATORS = re.compile(r'[!?;.,\s]+')


def count_words(lines):
    """Return a ``collections.Counter`` mapping each word to its frequency.

    Args:
        lines: An iterable of strings (for example an open text file).
            Trailing newlines do not need to be removed.

    Returns:
        A ``Counter`` whose keys are lower-cased words and whose values are
        the number of times each word occurs across all lines.
    """
    counts = collections.Counter()
    for line in lines:
        # Each line is tokenised on its own so the last word of one line can
        # never merge with the first word of the next.  Splitting on a run of
        # separators can still yield '' at the edges; those are dropped so an
        # empty string is never counted as a word.
        counts.update(
            word for word in _WORD_SEPARATORS.split(line.lower()) if word
        )
    return counts


def main(path=DEFAULT_PATH):
    """Print ``word count`` for every distinct word found in *path*.

    Args:
        path: Path of the text file to analyse.

    Raises:
        IOError/OSError: If the file cannot be opened or read.
    """
    with open(path, 'r') as f:
        counts = count_words(f)

    for word, count in counts.items():
        # A single pre-formatted argument prints identically on Python 2
        # and Python 3.
        print('%s %s' % (word, count))


if __name__ == '__main__':
    # An optional first command-line argument overrides the default file.
    main(sys.argv[1] if len(sys.argv) > 1 else DEFAULT_PATH)