these-3-words/words/wordnet.py

14 lines
405 B
Python
Raw Normal View History

import nltk
import string
lemmas = nltk.corpus.wordnet.all_lemma_names()
wordnet_lemmas = list(w.lower() for w in lemmas if 4<=len(w)<9 and
not any(c in string.punctuation for c in w) and
not any(c in string.digits for c in w))
assert len(wordnet_lemmas) == len(set(wordnet_lemmas))
f = open("wordnet-list", "w")
f.write("\n".join(wordnet_lemmas))
f.close()