mirror of
https://github.com/rommapp/romm.git
synced 2026-01-23 13:33:56 +08:00
Run file watcher using `opentelemetry-instrument` to enable tracing for the watcher service.
165 lines
5.7 KiB
Python
165 lines
5.7 KiB
Python
import enum
|
|
import json
|
|
import os
|
|
from collections.abc import Sequence
|
|
from datetime import timedelta
|
|
from typing import cast
|
|
|
|
import sentry_sdk
|
|
from config import (
|
|
ENABLE_RESCAN_ON_FILESYSTEM_CHANGE,
|
|
HASHEOUS_API_ENABLED,
|
|
LAUNCHBOX_API_ENABLED,
|
|
LIBRARY_BASE_PATH,
|
|
RESCAN_ON_FILESYSTEM_CHANGE_DELAY,
|
|
SENTRY_DSN,
|
|
)
|
|
from config.config_manager import config_manager as cm
|
|
from endpoints.sockets.scan import scan_platforms
|
|
from handler.database import db_platform_handler
|
|
from handler.metadata.igdb_handler import IGDB_API_ENABLED
|
|
from handler.metadata.moby_handler import MOBY_API_ENABLED
|
|
from handler.metadata.ra_handler import RA_API_ENABLED
|
|
from handler.metadata.sgdb_handler import STEAMGRIDDB_API_ENABLED
|
|
from handler.metadata.ss_handler import SS_API_ENABLED
|
|
from handler.scan_handler import MetadataSource, ScanType
|
|
from logger.formatter import CYAN
|
|
from logger.formatter import highlight as hl
|
|
from logger.logger import log
|
|
from opentelemetry import trace
|
|
from rq.job import Job
|
|
from tasks.tasks import tasks_scheduler
|
|
from utils import get_version
|
|
|
|
sentry_sdk.init(
|
|
dsn=SENTRY_DSN,
|
|
release=f"romm@{get_version()}",
|
|
)
|
|
tracer = trace.get_tracer(__name__)
|
|
|
|
structure_level = 2 if os.path.exists(cm.get_config().HIGH_PRIO_STRUCTURE_PATH) else 1
|
|
|
|
|
|
@enum.unique
|
|
class EventType(enum.StrEnum):
|
|
ADDED = "added"
|
|
MODIFIED = "modified"
|
|
DELETED = "deleted"
|
|
|
|
|
|
VALID_EVENTS = frozenset(
|
|
(
|
|
EventType.ADDED,
|
|
EventType.DELETED,
|
|
)
|
|
)
|
|
|
|
# A change is a tuple representing a file change, first element is the event type, second is the
|
|
# path of the file or directory that changed.
|
|
Change = tuple[EventType, str]
|
|
|
|
|
|
def process_changes(changes: Sequence[Change]) -> None:
|
|
if not ENABLE_RESCAN_ON_FILESYSTEM_CHANGE:
|
|
return
|
|
|
|
# Filter for valid events.
|
|
changes = [change for change in changes if change[0] in VALID_EVENTS]
|
|
if not changes:
|
|
return
|
|
|
|
with tracer.start_as_current_span("process_changes"):
|
|
# Find affected platform slugs.
|
|
fs_slugs: set[str] = set()
|
|
changes_platform_directory = False
|
|
for change in changes:
|
|
event_type, change_path = change
|
|
src_path = os.fsdecode(change_path)
|
|
event_src = src_path.split(LIBRARY_BASE_PATH)[-1]
|
|
event_src_parts = event_src.split("/")
|
|
if len(event_src_parts) <= structure_level:
|
|
log.warning(
|
|
f"Filesystem event path '{event_src}' does not have enough segments for structure_level {structure_level}. Skipping event."
|
|
)
|
|
continue
|
|
|
|
if len(event_src_parts) == structure_level + 1:
|
|
changes_platform_directory = True
|
|
|
|
log.info(f"Filesystem event: {event_type} {event_src}")
|
|
fs_slugs.add(event_src_parts[structure_level])
|
|
|
|
if not fs_slugs:
|
|
log.info("No valid filesystem slugs found in changes, exiting...")
|
|
return
|
|
|
|
# Check whether any metadata source is enabled.
|
|
source_mapping: dict[str, bool] = {
|
|
MetadataSource.IGDB: IGDB_API_ENABLED,
|
|
MetadataSource.SS: SS_API_ENABLED,
|
|
MetadataSource.MOBY: MOBY_API_ENABLED,
|
|
MetadataSource.RA: RA_API_ENABLED,
|
|
MetadataSource.LB: LAUNCHBOX_API_ENABLED,
|
|
MetadataSource.HASHEOUS: HASHEOUS_API_ENABLED,
|
|
MetadataSource.SGDB: STEAMGRIDDB_API_ENABLED,
|
|
}
|
|
metadata_sources = [source for source, flag in source_mapping.items() if flag]
|
|
if not metadata_sources:
|
|
log.warning("No metadata sources enabled, skipping rescan")
|
|
return
|
|
|
|
# Get currently scheduled jobs for the scan_platforms function.
|
|
already_scheduled_jobs = [
|
|
job
|
|
for job in tasks_scheduler.get_jobs()
|
|
if isinstance(job, Job)
|
|
and job.func_name == "endpoints.sockets.scan.scan_platforms"
|
|
]
|
|
|
|
# If a full rescan is already scheduled, skip further processing.
|
|
if any(job.args[0] == [] for job in already_scheduled_jobs):
|
|
log.info("Full rescan already scheduled")
|
|
return
|
|
|
|
time_delta = timedelta(minutes=RESCAN_ON_FILESYSTEM_CHANGE_DELAY)
|
|
rescan_in_msg = f"rescanning in {hl(str(RESCAN_ON_FILESYSTEM_CHANGE_DELAY), color=CYAN)} minutes."
|
|
|
|
# Any change to a platform directory should trigger a full rescan.
|
|
if changes_platform_directory:
|
|
log.info(f"Platform directory changed, {rescan_in_msg}")
|
|
tasks_scheduler.enqueue_in(
|
|
time_delta,
|
|
scan_platforms,
|
|
[],
|
|
scan_type=ScanType.UNIDENTIFIED,
|
|
metadata_sources=metadata_sources,
|
|
)
|
|
return
|
|
|
|
# Otherwise, process each platform slug.
|
|
for fs_slug in fs_slugs:
|
|
# TODO: Query platforms from the database in bulk.
|
|
db_platform = db_platform_handler.get_platform_by_fs_slug(fs_slug)
|
|
if not db_platform:
|
|
continue
|
|
|
|
# Skip if a scan is already scheduled for this platform.
|
|
if any(db_platform.id in job.args[0] for job in already_scheduled_jobs):
|
|
log.info(f"Scan already scheduled for {hl(fs_slug)}")
|
|
continue
|
|
|
|
log.info(f"Change detected in {hl(fs_slug)} folder, {rescan_in_msg}")
|
|
tasks_scheduler.enqueue_in(
|
|
time_delta,
|
|
scan_platforms,
|
|
[db_platform.id],
|
|
scan_type=ScanType.QUICK,
|
|
metadata_sources=metadata_sources,
|
|
)
|
|
|
|
|
|
if __name__ == "__main__":
|
|
changes = cast(list[Change], json.loads(os.getenv("WATCHFILES_CHANGES", "[]")))
|
|
if changes:
|
|
process_changes(changes)
|