14 lines
405 B
Python
14 lines
405 B
Python
import nltk
|
|
import string
|
|
|
|
|
|
lemmas = nltk.corpus.wordnet.all_lemma_names()
|
|
wordnet_lemmas = list(w.lower() for w in lemmas if 4<=len(w)<9 and
|
|
not any(c in string.punctuation for c in w) and
|
|
not any(c in string.digits for c in w))
|
|
assert len(wordnet_lemmas) == len(set(wordnet_lemmas))
|
|
|
|
f = open("wordnet-list", "w")
|
|
f.write("\n".join(wordnet_lemmas))
|
|
f.close()
|