mirror of
https://github.com/simon987/hexlib.git
synced 2025-04-21 18:46:42 +00:00
Compare commits
2 Commits
cd5a1ac50c
...
084acbe184
Author | SHA1 | Date | |
---|---|---|---|
084acbe184 | |||
d578be3218 |
@ -34,7 +34,7 @@ class StatelessStreamWorker:
|
||||
|
||||
|
||||
class StatelessStreamProcessor:
|
||||
def __init__(self, worker_factory, chunk_size=128, processes=1):
|
||||
def __init__(self, worker_factory, chunk_size=128, processes=1, timeout=60):
|
||||
self._chunk_size = 128
|
||||
self._queue = MPQueue(maxsize=chunk_size)
|
||||
self._queue_out = MPQueue(maxsize=processes * 2)
|
||||
@ -42,6 +42,7 @@ class StatelessStreamProcessor:
|
||||
self._processes = []
|
||||
self._factory = worker_factory
|
||||
self._workers = []
|
||||
self._timeout = timeout
|
||||
|
||||
if processes > 1:
|
||||
for _ in range(processes):
|
||||
@ -67,7 +68,7 @@ class StatelessStreamProcessor:
|
||||
ingest_thread = Thread(target=self._ingest, args=(iterable,))
|
||||
ingest_thread.start()
|
||||
|
||||
for results in queue_iter(self._queue_out, joinable=False, timeout=10):
|
||||
for results in queue_iter(self._queue_out, joinable=False, timeout=self._timeout):
|
||||
yield from results
|
||||
|
||||
ingest_thread.join()
|
||||
|
@ -85,7 +85,7 @@ def ndjson_iter(*files, compression=""):
|
||||
line_iter = BufferedReader(gzip.open(file))
|
||||
elif compression == COMPRESSION_ZSTD:
|
||||
fp = open(file, "rb")
|
||||
dctx = zstandard.ZstdDecompressor()
|
||||
dctx = zstandard.ZstdDecompressor(max_window_size=2147483648)
|
||||
reader = dctx.stream_reader(fp)
|
||||
line_iter = BufferedReader(reader)
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user