HPI/my/google/takeout/paths.py
karlicoss 8c2d1c9463 general: use less explicit kompress boilerplate in modules
now get_files/kompress library can handle it transparently
2023-10-20 21:13:59 +01:00

45 lines
1.3 KiB
Python

'''
Module for locating and accessing [[https://takeout.google.com][Google Takeout]] data
'''
from dataclasses import dataclass
from ...core.common import Paths, get_files
from ...core.util import __NOT_HPI_MODULE__
from my.config import google as user_config
from more_itertools import last
@dataclass
class google(user_config):
takeout_path: Paths # path/paths/glob for the takeout zips
###
# TODO rename 'google' to 'takeout'? not sure
from ...core.cfg import make_config
config = make_config(google)
from pathlib import Path
from typing import Optional, Iterable
def get_takeouts(*, path: Optional[str]=None) -> Iterable[Path]:
"""
Sometimes google splits takeout into multiple archives, so we need to detect the ones that contain the path we need
"""
# TODO FIXME zip is not great..
# allow a lambda expression? that way the user could restrict it
for takeout in get_files(config.takeout_path, glob='*.zip'):
if path is None or (takeout / path).exists():
yield takeout
def get_last_takeout(*, path: Optional[str]=None) -> Optional[Path]:
return last(get_takeouts(path=path), default=None)
# TODO might be a good idea to merge across multiple takeouts...
# perhaps even a special takeout module that deals with all of this automatically?
# e.g. accumulate, filter and maybe report useless takeouts?