diff options
| author | A Farzat <a@farzat.xyz> | 2025-08-21 09:41:56 +0300 | 
|---|---|---|
| committer | A Farzat <a@farzat.xyz> | 2025-08-21 09:41:56 +0300 | 
| commit | 69bcc9822c82ee6d726c98deafbdd0a20527a55a (patch) | |
| tree | e51ee23b3da922e1baf7bd57f5c724e928c70d86 /data-collection/components/subscriptions | |
| parent | b141aa29f28c4e4281415b97dac8fe548b128f9b (diff) | |
| download | csca5028-69bcc9822c82ee6d726c98deafbdd0a20527a55a.tar.gz csca5028-69bcc9822c82ee6d726c98deafbdd0a20527a55a.zip | |
Move components to root directory
Some components might be shared with other applications such as the data
analyser later on.
Diffstat (limited to 'data-collection/components/subscriptions')
| -rw-r--r-- | data-collection/components/subscriptions/main.py | 64 | ||||
| -rw-r--r-- | data-collection/components/subscriptions/typing.py | 13 | 
2 files changed, 0 insertions, 77 deletions
| diff --git a/data-collection/components/subscriptions/main.py b/data-collection/components/subscriptions/main.py deleted file mode 100644 index 26b0c64..0000000 --- a/data-collection/components/subscriptions/main.py +++ /dev/null @@ -1,64 +0,0 @@ -from dataclasses import dataclass, field, asdict -from datetime import datetime, UTC -from sys import stderr -from typing import TypedDict, List, cast -from bson.objectid import ObjectId -from feedparser import parse # type: ignore -from pymongo.collection import Collection -from pymongo.results import InsertOneResult, UpdateResult -import schedule -from components.database import subscriptions -from components.subscriptions.typing import SubsDict -from components.videos import VideoTuple - -@dataclass -class Subscription: -    _id: str -    link: str -    time_between_fetches: int -    last_fetch: datetime = datetime.min.replace(tzinfo=UTC) -    last_video_update: datetime = datetime.min.replace(tzinfo=UTC) -    videos: List[VideoTuple] = field(default_factory=list) -    subscribers: List[ObjectId] = field(default_factory=list) - -    def __post_init__(self) -> None: -        self._job: schedule.Job = schedule.every(self.time_between_fetches).minutes.do(self.fetch) -        self._collection: Collection[SubsDict] = subscriptions -        self._in_db: bool = False - -    def fetch(self) -> None: -        try: -            rss = parse(self.link) -        except Exception as e: -            print("Ran into an exception while fetching", self._id + ":", e, file=stderr) -            return -        for vid in map(VideoTuple.from_rss_entry, rss.entries): -            if vid.published > self.last_video_update: -                self.videos.append(vid) -            elif vid.updated > self.last_video_update: -                for i, old_vid in enumerate(self.videos): -                    if vid.id == old_vid.id: -                        self.videos[i] = vid -                        break -        last_video_update = max((vid.updated for vid in self.videos)) -        if last_video_update > self.last_video_update: -            print("Updating", self._id) -            self.last_video_update = last_video_update -            self.update_videos() -        self.last_fetch = datetime.now(tz=UTC) - -    def asdict(self) -> SubsDict: -        return cast(SubsDict, asdict(self)) - -    def insert(self) -> InsertOneResult: -        return self._collection.insert_one(self.asdict()) - -    def update_videos(self) -> UpdateResult: -        return self._collection.update_one( -            {"_id": self._id}, -            {"$set": { -                "videos": self.videos, -                "last_video_update": self.last_video_update, -                "last_fetch": self.last_fetch, -            }}, -        ) diff --git a/data-collection/components/subscriptions/typing.py b/data-collection/components/subscriptions/typing.py deleted file mode 100644 index 8f2a298..0000000 --- a/data-collection/components/subscriptions/typing.py +++ /dev/null @@ -1,13 +0,0 @@ -from datetime import datetime -from typing import TypedDict, List -from bson.objectid import ObjectId -from components.videos import VideoTuple - -class SubsDict(TypedDict): -    _id: str -    link: str -    time_between_fetches: int # In minutes. -    last_fetch: datetime -    last_video_update: datetime -    videos: List[VideoTuple] -    subscribers: List[ObjectId] | 
