mirror of
https://github.com/simon987/hexlib.git
synced 2025-04-10 14:06:43 +00:00
Silence nltk.download log output in text (use quiet=True instead of silent_stderr)
This commit is contained in:
parent
d895ac837e
commit
18cd59fc4a
@ -1,5 +1,4 @@
|
||||
import nltk.corpus
|
||||
from hexlib.misc import silent_stderr
|
||||
from lxml import etree
|
||||
from nltk.corpus import stopwords
|
||||
from nltk.stem import WordNetLemmatizer
|
||||
@ -10,9 +9,8 @@ get_text = etree.XPath("//text()")
|
||||
|
||||
stop_words_en = set(stopwords.words("english"))
|
||||
|
||||
with silent_stderr:
|
||||
nltk.download("stopwords")
|
||||
nltk.download("wordnet")
|
||||
nltk.download("stopwords", quiet=True)
|
||||
nltk.download("wordnet", quiet=True)
|
||||
|
||||
lemmatizer = WordNetLemmatizer()
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user