mirror of
https://github.com/simon987/hexlib.git
synced 2025-04-04 02:12:59 +00:00
Remove clean_multicore function
This commit is contained in:
parent
62e74ed292
commit
cd5a1ac50c
@@ -25,15 +25,6 @@ nltk.download("wordnet", quiet=True)
|
||||
lemmatizer = WordNetLemmatizer()
|
||||
|
||||
|
||||
def clean_multicore(texts, processes, chunk_size=10000, **kwargs):
|
||||
pool = Pool(processes=processes)
|
||||
yield from pool.imap(
|
||||
func=partial(preprocess, **kwargs),
|
||||
iterable=texts,
|
||||
chunksize=chunk_size
|
||||
)
|
||||
|
||||
|
||||
def _transform_bigram(ngram_seq, ngrams):
|
||||
for ngram in ngram_seq:
|
||||
if ngram in ngrams:
|
||||
|
Loading…
x
Reference in New Issue
Block a user