From 1ad2a5bffabb5d9077ce278e224017e974c7a4a7 Mon Sep 17 00:00:00 2001 From: Dima Gerasimov Date: Sun, 17 Mar 2019 15:09:24 +0000 Subject: [PATCH] make parallel processing optional --- reddit/__init__.py | 11 ++++++++--- 1 file changed, 8 insertions(+), 3 deletions(-) diff --git a/reddit/__init__.py b/reddit/__init__.py index 4e6e10d..ac8d480 100755 --- a/reddit/__init__.py +++ b/reddit/__init__.py @@ -120,7 +120,7 @@ def get_state(bfile: Path) -> Dict[Sid, Save]: return OrderedDict() -def get_events(all_=True) -> List[Event]: +def get_events(all_=True, parallel=True) -> List[Event]: backups = _get_backups(all_=all_) assert len(backups) > 0 @@ -129,8 +129,13 @@ def get_events(all_=True) -> List[Event]: # TODO suppress first batch?? # TODO for initial batch, treat event time as creation time - with Pool() as p: - states = p.map(get_state, backups) + states: Iterable[Dict[Sid, Save]] + if parallel: + with Pool() as p: + states = p.map(get_state, backups) + else: + # also make it lazy... + states = map(get_state, backups) RE = re.compile(r'reddit-(\d{14})') for i, (b, saves) in enumerate(zip(backups, states)): # TODO when date...