core.common: move stats-related stuff to my.core.stats and add more thorough tests/docs

deprecate core.common.stat and core.common.Stats with backwards compatibility
2024-08-15 17:51:46 +03:00 · 2024-08-15 17:51:46 +03:00 · c45c51af22
commit c45c51af22
parent 18529257e7
14 changed files with 343 additions and 246 deletions
--- a/my/calendar/holidays.py
+++ b/my/calendar/holidays.py
@ -9,7 +9,8 @@ from datetime import date, datetime, timedelta
 from functools import lru_cache
 from typing import Union

-from ..core.time import zone_to_countrycode
+from my.core import Stats
+from my.core.time import zone_to_countrycode


@lru_cache(1)
@ -46,7 +47,6 @@ def is_workday(d: DateIsh) -> bool:
    return not is_holiday(d)


-from ..core.common import Stats
 def stats() -> Stats:
    # meh, but not sure what would be a better test?
    res = {}
--- a/my/core/init.py
+++ b/my/core/init.py
@ -1,7 +1,7 @@
 # this file only keeps the most common & critical types/utility functions
 from .common import get_files, PathIsh, Paths
 from .common import Json
-from .common import stat, Stats
+from .stats import stat, Stats
 from .common import datetime_naive, datetime_aware
 from .compat import assert_never
 from .utils.itertools import warn_if_empty
--- a/my/core/main.py
+++ b/my/core/main.py
@ -243,9 +243,8 @@ def modules_check(*, verbose: bool, list_all: bool, quick: bool, for_modules: Li

    import contextlib

-    from .common import quick_stats
-    from .util import get_stats, HPIModule
-    from .stats import guess_stats
+    from .util import HPIModule
+    from .stats import get_stats, quick_stats
    from .error import warn_my_config_import_error

    mods: Iterable[HPIModule]
@ -276,11 +275,8 @@ def modules_check(*, verbose: bool, list_all: bool, quick: bool, for_modules: Li
            continue

        info(f'{click.style("OK", fg="green")}  : {m:<50}')
-        # first try explicitly defined stats function:
-        stats = get_stats(m)
-        if stats is None:
-            # then try guessing.. not sure if should log somehow?
-            stats = guess_stats(m, quick=quick)
+        # TODO add hpi 'stats'? instead of doctor? not sure
+        stats = get_stats(m, guess=True)

        if stats is None:
            eprint("       - no 'stats' function, can't check the data")
@ -291,6 +287,7 @@ def modules_check(*, verbose: bool, list_all: bool, quick: bool, for_modules: Li

        try:
            kwargs = {}
+            # todo hmm why wouldn't they be callable??
            if callable(stats) and 'quick' in inspect.signature(stats).parameters:
                kwargs['quick'] = quick
            with quick_context:
--- a/my/core/common.py
+++ b/my/core/common.py
@ -3,7 +3,6 @@ from pathlib import Path
 from datetime import datetime
 from dataclasses import is_dataclass, asdict as dataclasses_asdict
 import functools
-from contextlib import contextmanager
 import os
 from typing import (
    Any,
@ -11,13 +10,11 @@ from typing import (
    Dict,
    Iterable,
    List,
-    Optional,
    Sequence,
    TYPE_CHECKING,
    Tuple,
    TypeVar,
    Union,
-    cast,
 )
 import warnings

@ -179,183 +176,6 @@ def get_valid_filename(s: str) -> str:
    return re.sub(r'(?u)[^-\w.]', '', s)


-# global state that turns on/off quick stats
-# can use the 'quick_stats' contextmanager
-# to enable/disable this in cli so that module 'stats'
-# functions don't have to implement custom 'quick' logic
-QUICK_STATS = False
-
-
-# in case user wants to use the stats functions/quick option
-# elsewhere -- can use this decorator instead of editing
-# the global state directly
-@contextmanager
-def quick_stats():
-    global QUICK_STATS
-    prev = QUICK_STATS
-    try:
-        QUICK_STATS = True
-        yield
-    finally:
-        QUICK_STATS = prev
-
-
-C = TypeVar('C')
-Stats = Dict[str, Any]
-StatsFun = Callable[[], Stats]
-# todo not sure about return type...
-def stat(
-    func: Union[Callable[[], Iterable[C]], Iterable[C]],
-    *,
-    quick: bool = False,
-    name: Optional[str] = None,
-) -> Stats:
-    if callable(func):
-        fr = func()
-        if hasattr(fr, '__enter__') and hasattr(fr, '__exit__'):
-            # context managers has Iterable type, but they aren't data providers
-            # sadly doesn't look like there is a way to tell from typing annotations
-            return {}
-        fname = func.__name__
-    else:
-        # meh. means it's just a list.. not sure how to generate a name then
-        fr = func
-        fname = f'unnamed_{id(fr)}'
-    type_name = type(fr).__name__
-    if type_name == 'DataFrame':
-        # dynamic, because pandas is an optional dependency..
-        df = cast(Any, fr)  # todo ugh, not sure how to annotate properly
-        res = dict(
-            dtypes=df.dtypes.to_dict(),
-            rows=len(df),
-        )
-    else:
-        res = _stat_iterable(fr, quick=quick)
-
-    stat_name = name if name is not None else fname
-    return {
-        stat_name: res,
-    }
-
-
-def _stat_iterable(it: Iterable[C], quick: bool = False) -> Any:
-    from more_itertools import ilen, take, first
-
-    # todo not sure if there is something in more_itertools to compute this?
-    total = 0
-    errors = 0
-    first_item = None
-    last_item = None
-
-    def funcit():
-        nonlocal errors, first_item, last_item, total
-        for x in it:
-            total += 1
-            if isinstance(x, Exception):
-                errors += 1
-            else:
-                last_item = x
-                if first_item is None:
-                    first_item = x
-            yield x
-
-    eit = funcit()
-    count: Any
-    if quick or QUICK_STATS:
-        initial = take(100, eit)
-        count = len(initial)
-        if first(eit, None) is not None: # todo can actually be none...
-            # haven't exhausted
-            count = f'{count}+'
-    else:
-        count = ilen(eit)
-
-    res = {
-        'count': count,
-    }
-
-    if total == 0:
-        # not sure but I guess a good balance? wouldn't want to throw early here?
-        res['warning'] = 'THE ITERABLE RETURNED NO DATA'
-
-    if errors > 0:
-        res['errors'] = errors
-
-    def stat_item(item):
-        if item is None:
-            return None
-        if isinstance(item, Path):
-            return str(item)
-        return guess_datetime(item)
-
-    if (stat_first := stat_item(first_item)) is not None:
-        res['first'] = stat_first
-
-    if (stat_last := stat_item(last_item)) is not None:
-        res['last'] = stat_last
-
-    return res
-
-
-def test_stat_iterable() -> None:
-    from datetime import datetime, timedelta, timezone
-    from typing import NamedTuple
-
-    dd = datetime.fromtimestamp(123, tz=timezone.utc)
-    day = timedelta(days=3)
-
-    X = NamedTuple('X', [('x', int), ('d', datetime)])
-
-    def it():
-        yield RuntimeError('oops!')
-        for i in range(2):
-            yield X(x=i, d=dd + day * i)
-        yield RuntimeError('bad!')
-        for i in range(3):
-            yield X(x=i * 10, d=dd + day * (i * 10))
-        yield X(x=123, d=dd + day * 50)
-
-    res = _stat_iterable(it())
-    assert res['count']  == 1 + 2 + 1 + 3 + 1
-    assert res['errors'] == 1 + 1
-    assert res['last'] == dd + day * 50
-
-
-# experimental, not sure about it..
-def guess_datetime(x: Any) -> Optional[datetime]:
-    # todo hmm implement withoutexception..
-    try:
-        d = asdict(x)
-    except: # noqa: E722 bare except
-        return None
-    for k, v in d.items():
-        if isinstance(v, datetime):
-            return v
-    return None
-
-def test_guess_datetime() -> None:
-    from datetime import datetime
-    from dataclasses import dataclass
-    from typing import NamedTuple
-
-    dd = compat.fromisoformat('2021-02-01T12:34:56Z')
-
-    # ugh.. https://github.com/python/mypy/issues/7281
-    A = NamedTuple('A', [('x', int)])
-    B = NamedTuple('B', [('x', int), ('created', datetime)])
-
-    assert guess_datetime(A(x=4)) is None
-    assert guess_datetime(B(x=4, created=dd)) == dd
-
-    @dataclass
-    class C:
-        a: datetime
-        x: int
-    assert guess_datetime(C(a=dd, x=435)) == dd
-    # TODO not sure what to return when multiple datetime fields?
-    # TODO test @property?
-
-
 def is_namedtuple(thing: Any) -> bool:
    # basic check to see if this is namedtuple-like
    _asdict = getattr(thing, '_asdict', None)
@ -389,6 +209,9 @@ from .utils.itertools import unique_everseen
 ## hiding behind TYPE_CHECKING so it works in runtime
 ## in principle, warnings.deprecated decorator should cooperate with mypy, but doesn't look like it works atm?
 ## perhaps it doesn't work when it's used from typing_extensions
+
+from .compat import Never
+
 if not TYPE_CHECKING:

    @deprecated('use my.core.compat.assert_never instead')
@ -439,6 +262,12 @@ if not TYPE_CHECKING:

        return UI.listify(*args, **kwargs)

+    @deprecated('use my.core.stat instead')
+    def stat(*args, **kwargs):
+        from . import stats
+
+        return stats.stat(*args, **kwargs)
+
    # todo wrap these in deprecated decorator as well?
    from .cachew import mcachew  # noqa: F401

@ -447,7 +276,7 @@ if not TYPE_CHECKING:
    # TODO hmm how to deprecate it in runtime? tricky cause it's actually a class?
    tzdatetime = datetime_aware
 else:
-    from .compat import Never
-
    tzdatetime = Never  # makes it invalid as a type while working in runtime
+
+Stats = Never
 ###
--- a/my/core/stats.py
+++ b/my/core/stats.py
@ -1,23 +1,181 @@
 '''
 Helpers for hpi doctor/stats functionality.
 '''
+
 import collections
+from contextlib import contextmanager
+from datetime import datetime
 import importlib
 import inspect
+from pathlib import Path
+from types import ModuleType
 import typing
-from typing import Optional, Callable, Any, Iterator, Sequence, Dict, List
+from typing import (
+    Any,
+    Callable,
+    Dict,
+    Iterable,
+    Iterator,
+    List,
+    Optional,
+    Protocol,
+    Sequence,
+    Union,
+    cast,
+)

-from .common import StatsFun, Stats, stat
+
+Stats = Dict[str, Any]
+
+
+class StatsFun(Protocol):
+    def __call__(self, quick: bool = False) -> Stats: ...
+
+
+# global state that turns on/off quick stats
+# can use the 'quick_stats' contextmanager
+# to enable/disable this in cli so that module 'stats'
+# functions don't have to implement custom 'quick' logic
+QUICK_STATS = False
+
+
+# in case user wants to use the stats functions/quick option
+# elsewhere -- can use this decorator instead of editing
+# the global state directly
+@contextmanager
+def quick_stats():
+    global QUICK_STATS
+    prev = QUICK_STATS
+    try:
+        QUICK_STATS = True
+        yield
+    finally:
+        QUICK_STATS = prev
+
+
+def stat(
+    func: Union[Callable[[], Iterable[Any]], Iterable[Any]],
+    *,
+    quick: bool = False,
+    name: Optional[str] = None,
+) -> Stats:
+    """
+    Extracts various statistics from a passed iterable/callable, e.g.:
+    - number of items
+    - first/last item
+    - timestamps associated with first/last item
+
+    If quick is set, then only first 100 items of the iterable will be processed
+    """
+    if callable(func):
+        fr = func()
+        if hasattr(fr, '__enter__') and hasattr(fr, '__exit__'):
+            # context managers has Iterable type, but they aren't data providers
+            #  sadly doesn't look like there is a way to tell from typing annotations
+            # Ideally we'd detect this in is_data_provider...
+            #  but there is no way of knowing without actually calling it first :(
+            return {}
+        fname = func.__name__
+    else:
+        # meh. means it's just a list.. not sure how to generate a name then
+        fr = func
+        fname = f'unnamed_{id(fr)}'
+    type_name = type(fr).__name__
+    extras = {}
+    if type_name == 'DataFrame':
+        # dynamic, because pandas is an optional dependency..
+        df = cast(Any, fr)  # todo ugh, not sure how to annotate properly
+        df = df.reset_index()
+
+        fr = df.to_dict(orient='records')
+
+        dtypes = df.dtypes.to_dict()
+        extras['dtypes'] = dtypes
+
+    res = _stat_iterable(fr, quick=quick)
+    res.update(extras)
+
+    stat_name = name if name is not None else fname
+    return {
+        stat_name: res,
+    }
+
+
+def test_stat() -> None:
+    # the bulk of testing is in test_stat_iterable
+
+    # works with 'anonymous' lists
+    res = stat([1, 2, 3])
+    [(name, v)] = res.items()
+    # note: name will be a little funny since anonymous list doesn't have one
+    assert v == {'count': 3}
+    #
+
+    # works with functions:
+    def fun():
+        return [4, 5, 6]
+
+    assert stat(fun) == {'fun': {'count': 3}}
+    #
+
+    # context managers are technically iterable
+    #  , but usually we wouldn't want to compute stats for them
+    # this is mainly intended for guess_stats,
+    #  since it can't tell whether the function is a ctx manager without calling it
+    @contextmanager
+    def cm():
+        yield 1
+        yield 3
+
+    assert stat(cm) == {}  # type: ignore[arg-type]
+    #
+
+    # works with pandas dataframes
+    import pandas as pd
+    import numpy as np
+
+    def df() -> pd.DataFrame:
+        dates = pd.date_range(start='2024-02-10 08:00', end='2024-02-11 16:00', freq='5h')
+        return pd.DataFrame([f'value{i}' for i, _ in enumerate(dates)], index=dates, columns=['value'])
+
+    assert stat(df) == {
+        'df': {
+            'count': 7,
+            'dtypes': {
+                'index': np.dtype('<M8[ns]'),
+                'value': np.dtype('O'),
+            },
+            'first': pd.Timestamp('2024-02-10 08:00'),
+            'last': pd.Timestamp('2024-02-11 14:00'),
+        },
+    }
+    #
+
+
+def get_stats(module_name: str, *, guess: bool = False) -> Optional[StatsFun]:
+    stats: Optional[StatsFun] = None
+    try:
+        module = importlib.import_module(module_name)
+    except Exception:
+        return None
+    stats = getattr(module, 'stats', None)
+    if stats is None:
+        stats = guess_stats(module)
+    return stats


 # TODO maybe could be enough to annotate OUTPUTS or something like that?
 # then stats could just use them as hints?
-def guess_stats(module_name: str, quick: bool = False) -> Optional[StatsFun]:
-    providers = guess_data_providers(module_name)
+def guess_stats(module: ModuleType) -> Optional[StatsFun]:
+    """
+    If the module doesn't have explicitly defined 'stat' function,
+     this is used to try to guess what could be included in stats automatically
+    """
+    providers = _guess_data_providers(module)
    if len(providers) == 0:
        return None

-    def auto_stats() -> Stats:
+    def auto_stats(quick: bool = False) -> Stats:
        res = {}
        for k, v in providers.items():
            res.update(stat(v, quick=quick, name=k))
@ -27,12 +185,11 @@ def guess_stats(module_name: str, quick: bool = False) -> Optional[StatsFun]:


 def test_guess_stats() -> None:
-    from datetime import datetime
    import my.core.tests.auto_stats as M

-    auto_stats = guess_stats(M.__name__)
+    auto_stats = guess_stats(M)
    assert auto_stats is not None
-    res = auto_stats()
+    res = auto_stats(quick=False)

    assert res == {
        'inputs': {
@ -48,15 +205,15 @@ def test_guess_stats() -> None:
    }


-def guess_data_providers(module_name: str) -> Dict[str, Callable]:
-    module = importlib.import_module(module_name)
+def _guess_data_providers(module: ModuleType) -> Dict[str, Callable]:
    mfunctions = inspect.getmembers(module, inspect.isfunction)
    return {k: v for k, v in mfunctions if is_data_provider(v)}


-# todo how to exclude deprecated stuff?
+# todo how to exclude deprecated data providers?
 def is_data_provider(fun: Any) -> bool:
    """
+    Criteria for being a "data provider":
    1. returns iterable or something like that
    2. takes no arguments? (otherwise not callable by stats anyway?)
    3. doesn't start with an underscore (those are probably helper functions?)
@ -72,7 +229,7 @@ def is_data_provider(fun: Any) -> bool:
        return False

    # has at least one argument without default values
-    if len(list(sig_required_params(sig))) > 0:
+    if len(list(_sig_required_params(sig))) > 0:
        return False

    if hasattr(fun, '__name__'):
@ -88,7 +245,7 @@ def is_data_provider(fun: Any) -> bool:
    if return_type is None:
        return False

-    return type_is_iterable(return_type)
+    return _type_is_iterable(return_type)


 def test_is_data_provider() -> None:
@ -99,6 +256,7 @@ def test_is_data_provider() -> None:

    def no_return_type():
        return [1, 2, 3]
+
    assert not idp(no_return_type)

    lam = lambda: [1, 2]
@ -106,27 +264,34 @@ def test_is_data_provider() -> None:

    def has_extra_args(count) -> List[int]:
        return list(range(count))
+
    assert not idp(has_extra_args)

    def has_return_type() -> Sequence[str]:
        return ['a', 'b', 'c']
+
    assert idp(has_return_type)

    def _helper_func() -> Iterator[Any]:
        yield 1
+
    assert not idp(_helper_func)

    def inputs() -> Iterator[Any]:
        yield 1
+
    assert idp(inputs)

    def producer_inputs() -> Iterator[Any]:
        yield 1
+
    assert idp(producer_inputs)


-# return any parameters the user is required to provide - those which don't have default values
-def sig_required_params(sig: inspect.Signature) -> Iterator[inspect.Parameter]:
+def _sig_required_params(sig: inspect.Signature) -> Iterator[inspect.Parameter]:
+    """
+    Returns parameters the user is required to provide - e.g. ones that don't have default values
+    """
    for param in sig.parameters.values():
        if param.default == inspect.Parameter.empty:
            yield param
@ -136,21 +301,24 @@ def test_sig_required_params() -> None:

    def x() -> int:
        return 5
-    assert len(list(sig_required_params(inspect.signature(x)))) == 0
+
+    assert len(list(_sig_required_params(inspect.signature(x)))) == 0

    def y(arg: int) -> int:
        return arg
-    assert len(list(sig_required_params(inspect.signature(y)))) == 1
+
+    assert len(list(_sig_required_params(inspect.signature(y)))) == 1

    # from stats perspective, this should be treated as a data provider as well
    # could be that the default value to the data provider is the 'default'
    # path to use for inputs/a function to provide input data
    def z(arg: int = 5) -> int:
        return arg
-    assert len(list(sig_required_params(inspect.signature(z)))) == 0
+
+    assert len(list(_sig_required_params(inspect.signature(z)))) == 0


-def type_is_iterable(type_spec) -> bool:
+def _type_is_iterable(type_spec) -> bool:
    origin = typing.get_origin(type_spec)
    if origin is None:
        return False
@ -167,9 +335,7 @@ def type_is_iterable(type_spec) -> bool:

 # todo docstring test?
 def test_type_is_iterable() -> None:
-    from typing import List, Sequence, Iterable, Dict, Any
-
-    fun = type_is_iterable
+    fun = _type_is_iterable
    assert not fun(None)
    assert not fun(int)
    assert not fun(Any)
@ -178,3 +344,126 @@ def test_type_is_iterable() -> None:
    assert fun(List[int])
    assert fun(Sequence[Dict[str, str]])
    assert fun(Iterable[Any])
+
+
+def _stat_item(item):
+    if item is None:
+        return None
+    if isinstance(item, Path):
+        return str(item)
+    return _guess_datetime(item)
+
+
+def _stat_iterable(it: Iterable[Any], quick: bool = False) -> Stats:
+    from more_itertools import ilen, take, first
+
+    # todo not sure if there is something in more_itertools to compute this?
+    total = 0
+    errors = 0
+    first_item = None
+    last_item = None
+
+    def funcit():
+        nonlocal errors, first_item, last_item, total
+        for x in it:
+            total += 1
+            if isinstance(x, Exception):
+                errors += 1
+            else:
+                last_item = x
+                if first_item is None:
+                    first_item = x
+            yield x
+
+    eit = funcit()
+    count: Any
+    if quick or QUICK_STATS:
+        initial = take(100, eit)
+        count = len(initial)
+        if first(eit, None) is not None:  # todo can actually be none...
+            # haven't exhausted
+            count = f'{count}+'
+    else:
+        count = ilen(eit)
+
+    res = {
+        'count': count,
+    }
+
+    if total == 0:
+        # not sure but I guess a good balance? wouldn't want to throw early here?
+        res['warning'] = 'THE ITERABLE RETURNED NO DATA'
+
+    if errors > 0:
+        res['errors'] = errors
+
+    if (stat_first := _stat_item(first_item)) is not None:
+        res['first'] = stat_first
+
+    if (stat_last := _stat_item(last_item)) is not None:
+        res['last'] = stat_last
+
+    return res
+
+
+def test_stat_iterable() -> None:
+    from datetime import datetime, timedelta, timezone
+    from typing import NamedTuple
+
+    dd = datetime.fromtimestamp(123, tz=timezone.utc)
+    day = timedelta(days=3)
+
+    X = NamedTuple('X', [('x', int), ('d', datetime)])
+
+    def it():
+        yield RuntimeError('oops!')
+        for i in range(2):
+            yield X(x=i, d=dd + day * i)
+        yield RuntimeError('bad!')
+        for i in range(3):
+            yield X(x=i * 10, d=dd + day * (i * 10))
+        yield X(x=123, d=dd + day * 50)
+
+    res = _stat_iterable(it())
+    assert res['count'] == 1 + 2 + 1 + 3 + 1
+    assert res['errors'] == 1 + 1
+    assert res['last'] == dd + day * 50
+
+
+# experimental, not sure about it..
+def _guess_datetime(x: Any) -> Optional[datetime]:
+    from .common import asdict  # avoid circular imports
+
+    # todo hmm implement without exception..
+    try:
+        d = asdict(x)
+    except:  # noqa: E722 bare except
+        return None
+    for k, v in d.items():
+        if isinstance(v, datetime):
+            return v
+    return None
+
+
+def test_guess_datetime() -> None:
+    from dataclasses import dataclass
+    from typing import NamedTuple
+    from .compat import fromisoformat
+
+    dd = fromisoformat('2021-02-01T12:34:56Z')
+
+    # ugh.. https://github.com/python/mypy/issues/7281
+    A = NamedTuple('A', [('x', int)])
+    B = NamedTuple('B', [('x', int), ('created', datetime)])
+
+    assert _guess_datetime(A(x=4)) is None
+    assert _guess_datetime(B(x=4, created=dd)) == dd
+
+    @dataclass
+    class C:
+        a: datetime
+        x: int
+
+    assert _guess_datetime(C(a=dd, x=435)) == dd
+    # TODO not sure what to return when multiple datetime fields?
+    # TODO test @property?
--- a/my/core/util.py
+++ b/my/core/util.py
@ -1,6 +1,5 @@
 from pathlib import Path
 from itertools import chain
-from importlib import import_module
 import os
 import pkgutil
 import sys
@ -15,17 +14,6 @@ def modules() -> Iterable[HPIModule]:
        yield m


-from .common import StatsFun
-def get_stats(module: str) -> Optional[StatsFun]:
-    # todo detect via ast?
-    try:
-        mod = import_module(module)
-    except Exception:
-        return None
-
-    return getattr(mod, 'stats', None)
-
-
 __NOT_HPI_MODULE__ = 'Import this to mark a python file as a helper, not an actual HPI module'
 from .discovery_pure import NOT_HPI_MODULE_VAR
 assert NOT_HPI_MODULE_VAR in globals()  # check name consistency
--- a/my/google/takeout/parser.py
+++ b/my/google/takeout/parser.py
@ -18,9 +18,9 @@ from contextlib import ExitStack
 import os
 from typing import List, Sequence, cast
 from pathlib import Path
-from my.core import make_config, dataclass
+from my.core import make_config, dataclass, stat, Stats
 from my.core.cachew import mcachew
-from my.core.common import Stats, LazyLogger, get_files, Paths
+from my.core.common import LazyLogger, get_files, Paths
 from my.core.error import ErrorPolicy
 from my.core.structure import match_structure

@ -133,8 +133,6 @@ def events(disable_takeout_cache: bool = DISABLE_TAKEOUT_CACHE) -> CacheResults:


 def stats() -> Stats:
-    from my.core import stat
-
    return {
        **stat(events),
    }
--- a/my/location/google.py
+++ b/my/location/google.py
@ -19,6 +19,7 @@ import re
 # pip3 install geopy
 import geopy # type: ignore

+from my.core import stat, Stats
 from my.core.common import LazyLogger
 from my.core.cachew import cache_dir, mcachew

@ -164,7 +165,6 @@ def locations(**kwargs) -> Iterable[Location]:
    return _iter_locations(path=last_takeout, **kwargs)


-from ..core.common import stat, Stats
 def stats() -> Stats:
    return stat(locations)

--- a/my/location/google_takeout.py
+++ b/my/location/google_takeout.py
@ -9,8 +9,8 @@ from typing import Iterator
 from my.google.takeout.parser import events, _cachew_depends_on
 from google_takeout_parser.models import Location as GoogleLocation

+from my.core import stat, Stats, LazyLogger
 from my.core.cachew import mcachew
-from my.core.common import LazyLogger, stat, Stats
 from .common import Location

 logger = LazyLogger(__name__)
--- a/my/location/google_takeout_semantic.py
+++ b/my/location/google_takeout_semantic.py
@ -12,9 +12,8 @@ from typing import Iterator, List
 from my.google.takeout.parser import events, _cachew_depends_on as _parser_cachew_depends_on
 from google_takeout_parser.models import PlaceVisit as SemanticLocation

-from my.core import dataclass, make_config
+from my.core import dataclass, make_config, stat, LazyLogger, Stats
 from my.core.cachew import mcachew
-from my.core.common import LazyLogger, Stats, stat
 from my.core.error import Res
 from .common import Location

--- a/my/reddit/all.py
+++ b/my/reddit/all.py
@ -1,5 +1,5 @@
 from typing import Iterator
-from my.core.common import Stats
+from my.core import stat, Stats
 from my.core.source import import_source

 from .common import Save, Upvote, Comment, Submission, _merge_comments
@ -58,7 +58,6 @@ def upvoted() -> Iterator[Upvote]:
    yield from upvoted()

 def stats() -> Stats:
-    from my.core import stat
    return {
        **stat(saved),
        **stat(comments),
--- a/my/reddit/pushshift.py
+++ b/my/reddit/pushshift.py
@ -8,8 +8,9 @@ REQUIRES = [
    "git+https://github.com/seanbreckenridge/pushshift_comment_export",
 ]

-from my.core.common import Paths, Stats
 from dataclasses import dataclass
+
+from my.core import Paths, Stats, stat
 from my.core.cfg import make_config

 # note: keeping pushshift import before config import, so it's handled gracefully by import_source
@ -43,7 +44,6 @@ def comments() -> Iterator[PComment]:
        yield from read_file(f)

 def stats() -> Stats:
-    from my.core import stat
    return {
        **stat(comments)
    }
--- a/my/rescuetime.py
+++ b/my/rescuetime.py
@ -9,7 +9,7 @@ from pathlib import Path
 from datetime import timedelta
 from typing import Sequence, Iterable

-from my.core import get_files, make_logger
+from my.core import get_files, make_logger, stat, Stats
 from my.core.cachew import mcachew
 from my.core.error import Res, split_errors

@ -47,7 +47,6 @@ def dataframe() -> DataFrameT:
    return as_dataframe(entries())


-from .core import stat, Stats
 def stats() -> Stats:
    return {
        **stat(groups),
--- a/my/smscalls.py
+++ b/my/smscalls.py
@ -7,7 +7,9 @@ Exported using https://play.google.com/store/apps/details?id=com.riteshsahu.SMSB

 REQUIRES = ['lxml']

-from .core import Paths, dataclass
+from dataclasses import dataclass
+
+from my.core import get_files, stat, Paths, Stats
 from my.config import smscalls as user_config

@dataclass
@ -15,7 +17,7 @@ class smscalls(user_config):
    # path[s] that SMSBackupRestore syncs XML files to
    export_path: Paths

-from .core.cfg import make_config
+from my.core.cfg import make_config
 config = make_config(smscalls)

 from datetime import datetime, timezone
@ -24,7 +26,6 @@ from typing import NamedTuple, Iterator, Set, Tuple, Optional, Any, Dict, List

 from lxml import etree

-from my.core.common import get_files, Stats
 from my.core.error import Res


@ -316,8 +317,6 @@ def _parse_dt_ms(d: str) -> datetime:


 def stats() -> Stats:
-    from .core import stat
-
    return {
        **stat(calls),
        **stat(messages),