自然语言处理 NLTK 分词断句 (2)
from nltk.corpus import gutenberg
import nltk

# Disabled exploratory snippet: reads the words of 'melville-moby_dick.txt'
# from the Gutenberg corpus, wraps them in an nltk.Text and prints both.
# file = gutenberg.words('melville-moby_dick.txt')
# text = nltk.Text(file)
# print(file)
# print(text)
# NOTE(review): the next line is cut off in the source; the remainder of the
# findall pattern is not visible, so it is kept exactly as found.
# print(text.findall('<a> (<.*>) <...