some enhancements for facebook/instagram modules

figured out that datetimes are naive
better username handling + investigation of thread names
This commit is contained in:
Dima Gerasimov 2022-06-04 10:29:50 +01:00 committed by karlicoss
parent 7323e99504
commit b9d788efd0
4 changed files with 29 additions and 13 deletions

View file

@ -38,10 +38,12 @@ class Thread:
name: Optional[str]
# todo not sure about order of fields...
from ..core import datetime_naive
@dataclass
class _BaseMessage:
id: str
dt: datetime
# checked against a message sent on 4 May 2022, and the timestamp does look naive
dt: datetime_naive
text: Optional[str]

View file

@ -43,3 +43,9 @@ def _merge_messages(*sources: Iterator[Res[Message]]) -> Iterator[Res[Message]]:
# similar to twitter, might make sense to generify/document as a pattern
return (r.id, r.dt)
yield from unique_everseen(chain(*sources), key=key)
# TODO: some notes about the GDPR export (since there is no module for it yet)
# ugh, messages seem to go from new to old in the messages_N.json files as N increases :facepalm:
# seems like it's storing local timestamps :facepalm:
# checked against a message sent on 4 May 2022