summaryrefslogtreecommitdiff
path: root/data-collection/components/subscriptions/main.py
diff options
context:
space:
mode:
authorA Farzat <a@farzat.xyz>2025-08-21 09:41:56 +0300
committerA Farzat <a@farzat.xyz>2025-08-21 09:41:56 +0300
commit69bcc9822c82ee6d726c98deafbdd0a20527a55a (patch)
treee51ee23b3da922e1baf7bd57f5c724e928c70d86 /data-collection/components/subscriptions/main.py
parentb141aa29f28c4e4281415b97dac8fe548b128f9b (diff)
downloadcsca5028-69bcc9822c82ee6d726c98deafbdd0a20527a55a.tar.gz
csca5028-69bcc9822c82ee6d726c98deafbdd0a20527a55a.zip
Move components to root directory
Some components might be shared with other applications such as the data analyser later on.
Diffstat (limited to 'data-collection/components/subscriptions/main.py')
-rw-r--r--data-collection/components/subscriptions/main.py64
1 files changed, 0 insertions, 64 deletions
diff --git a/data-collection/components/subscriptions/main.py b/data-collection/components/subscriptions/main.py
deleted file mode 100644
index 26b0c64..0000000
--- a/data-collection/components/subscriptions/main.py
+++ /dev/null
@@ -1,64 +0,0 @@
-from dataclasses import dataclass, field, asdict
-from datetime import datetime, UTC
-from sys import stderr
-from typing import TypedDict, List, cast
-from bson.objectid import ObjectId
-from feedparser import parse # type: ignore
-from pymongo.collection import Collection
-from pymongo.results import InsertOneResult, UpdateResult
-import schedule
-from components.database import subscriptions
-from components.subscriptions.typing import SubsDict
-from components.videos import VideoTuple
-
-@dataclass
-class Subscription:
- _id: str
- link: str
- time_between_fetches: int
- last_fetch: datetime = datetime.min.replace(tzinfo=UTC)
- last_video_update: datetime = datetime.min.replace(tzinfo=UTC)
- videos: List[VideoTuple] = field(default_factory=list)
- subscribers: List[ObjectId] = field(default_factory=list)
-
- def __post_init__(self) -> None:
- self._job: schedule.Job = schedule.every(self.time_between_fetches).minutes.do(self.fetch)
- self._collection: Collection[SubsDict] = subscriptions
- self._in_db: bool = False
-
- def fetch(self) -> None:
- try:
- rss = parse(self.link)
- except Exception as e:
- print("Ran into an exception while fetching", self._id + ":", e, file=stderr)
- return
- for vid in map(VideoTuple.from_rss_entry, rss.entries):
- if vid.published > self.last_video_update:
- self.videos.append(vid)
- elif vid.updated > self.last_video_update:
- for i, old_vid in enumerate(self.videos):
- if vid.id == old_vid.id:
- self.videos[i] = vid
- break
- last_video_update = max((vid.updated for vid in self.videos))
- if last_video_update > self.last_video_update:
- print("Updating", self._id)
- self.last_video_update = last_video_update
- self.update_videos()
- self.last_fetch = datetime.now(tz=UTC)
-
- def asdict(self) -> SubsDict:
- return cast(SubsDict, asdict(self))
-
- def insert(self) -> InsertOneResult:
- return self._collection.insert_one(self.asdict())
-
- def update_videos(self) -> UpdateResult:
- return self._collection.update_one(
- {"_id": self._id},
- {"$set": {
- "videos": self.videos,
- "last_video_update": self.last_video_update,
- "last_fetch": self.last_fetch,
- }},
- )