python nltk模块正在创建它自己的错误

时间:2018-01-29 19:35:50

标签: python nltk


from nltk.corpus import stopwords
from nltk.tokenize import word_tokenize

# Remove English stop words from a sample sentence using NLTK.
#
# NOTE(review): the accompanying traceback shows the standard library's
# `import tokenize` loading a file from the script's own directory whose
# first line is the stopwords import above -- presumably this script was
# saved as tokenize.py. Rename it so it does not shadow the stdlib module.
example_sent = "This is a sample sentence, showing off the stop words filtration."

# Build the stop-word collection as a set so membership tests are cheap.
stop_words = set(stopwords.words('english'))

word_tokens = word_tokenize(example_sent)

# Compact form: keep every token that is not a stop word.
filtered_sentence = [w for w in word_tokens if w not in stop_words]

# Equivalent explicit loop; it rebuilds the same list from scratch.
filtered_sentence = []

for w in word_tokens:
    if w not in stop_words:
        filtered_sentence.append(w)



File "/Users/nicolas/Desktop/part 1 natural lenguage/", line 1, in <module>
    from nltk.tokenize import sent_tokenize, word_tokenize
  File "/Library/Python/2.7/site-packages/nltk/", line 114, in <module>
    from nltk.collocations import *
  File "/Library/Python/2.7/site-packages/nltk/", line 37, in <module>
    from nltk.probability import FreqDist
  File "/Library/Python/2.7/site-packages/nltk/", line 47, in <module>
    from collections import defaultdict, Counter
  File "/Library/Python/2.7/site-packages/nltk/", line 13, in <module>
    import pydoc
  File "/System/Library/Frameworks/Python.framework/Versions/2.7/lib/python2.7/", line 56, in <module>
    import sys, imp, os, re, types, inspect, __builtin__, pkgutil, warnings
  File "/System/Library/Frameworks/Python.framework/Versions/2.7/lib/python2.7/", line 39, in <module>
    import tokenize
  File "/Users/nicolas/Desktop/part 1 natural lenguage/", line 1, in <module>
    from nltk.corpus import stopwords
  File "/Library/Python/2.7/site-packages/nltk/corpus/", line 64, in <module>
    from nltk.tokenize import RegexpTokenizer
  File "/Library/Python/2.7/site-packages/nltk/tokenize/", line 67, in <module>
    from nltk.tokenize.mwe      import MWETokenizer
  File "/Library/Python/2.7/site-packages/nltk/tokenize/", line 31, in <module>
    from nltk.util import Trie
  File "/Library/Python/2.7/site-packages/nltk/", line 21, in <module>
    from collections import defaultdict, deque
ImportError: cannot import name defaultdict
iMac-di-Monica:part 1 natural lenguage nicolas$ 


from nltk.tokenize import sent_tokenize, word_tokenize

# Sample paragraph to split into word-level tokens.
EXAMPLE_TEXT = "Hello Mr. Smith, how are you doing today? The weather is great, and Python is awesome. The sky is pinkish-blue. You shouldn't eat cardboard."


# Print each token produced by word_tokenize on its own line.
for token in word_tokenize(EXAMPLE_TEXT):
    print(token)


0 个答案:
