#coding:utf-8
#import string
# -*- coding: utf-8 -*-
import docx
import re
# Path of the Word document whose words are counted when run as a script.
file_path ='dear.docx'

# Punctuation characters that are replaced by a space before splitting.
# The pattern is kept exactly as in the original script; the doubled quote
# inside the character class is redundant but harmless.
_PUNCTUATION = re.compile(r'[,.""?!]')


def count_words(texts):
    """Return a dict mapping each lower-cased word in *texts* to its count.

    texts: iterable of strings (for example, the text of each paragraph).

    Each string has the characters , . " ? ! replaced by a space, is
    lower-cased, and is then split on whitespace.  Empty input yields an
    empty dict.
    """
    word_counts = {}
    for text in texts:
        cleaned = _PUNCTUATION.sub(" ", text).lower()
        for word in cleaned.split():
            # A single lookup replaces the original setdefault() call plus
            # the always-true membership test.
            word_counts[word] = word_counts.get(word, 0) + 1
    return word_counts


def main():
    """Count the words of every paragraph in `file_path` and print the dict."""
    doc = docx.Document(file_path)
    word_counts = count_words(paragraph.text for paragraph in doc.paragraphs)
    # Parenthesised single argument: prints the same on Python 2 and 3.
    print(word_counts)


if __name__ == "__main__":
    main()
# Image from the original post: https://img.haomeiwen.com/i10820970/cd0ba9365a2ba905.png
# (The reader-comments section of the source web page followed here.)