MediaProcessing/apps/py-metadata/worker/poller.py
2026-01-29 23:32:00 +01:00

83 lines
2.9 KiB
Python

import asyncio
import time
import uuid
from typing import Optional
from db.database import Database
from db.repository import (
claim_task,
fetch_next_task,
mark_failed,
persist_event_and_mark_consumed
)
from models.event import MetadataSearchResultEvent
from worker.processor import process_task
from utils.logger import logger
from models.task import MetadataSearchTask, Task
# Viktig: dette er heartbeat_ref fra app.py
from app import set_heartbeat as heartbeat_ref
def run_iteration(db: Database, worker_id: str, poll_interval: int) -> tuple[int, int]:
    """
    Run a single iteration of the poller loop.

    Fetches the next task, claims it for ``worker_id``, processes it and
    persists the resulting event. The worker state (active, idle/backoff or
    error) is reported through ``heartbeat_ref``.

    Args:
        db: Database handle passed on to the repository functions; it is also
            asked to reconnect when the iteration fails unexpectedly.
        worker_id: Identifier used when claiming a task.
        poll_interval: Current poll interval in seconds.

    Returns:
        A ``(sleep_interval, next_poll_interval)`` tuple. ``sleep_interval``
        is always the incoming ``poll_interval``. ``next_poll_interval`` is:

        * ``5`` after a task was processed (successfully or not) or after an
          unexpected error,
        * ``min(poll_interval * 2, 60)`` when no task was available,
        * the unchanged ``poll_interval`` when the task was skipped (unknown
          type, or already claimed by another worker).

    Exceptions derived from ``Exception`` are caught and logged, including a
    failed reconnect attempt, so the caller's loop keeps running. An exception
    raised by ``heartbeat_ref`` inside the error handler is not caught.
    """
    try:
        task: Optional[Task] = fetch_next_task(db)

        if not task:
            # No tasks -> the worker goes into backoff (doubling, capped at 60 s).
            logger.debug("Ingen nye tasks.")
            heartbeat_ref(time.time(), in_backoff=True, error=None)
            return poll_interval, min(poll_interval * 2, 60)

        # The worker is active -> not in backoff.
        heartbeat_ref(time.time(), in_backoff=False, error=None)

        if not isinstance(task, MetadataSearchTask):
            # NOTE(review): the task is neither claimed nor marked here, so it
            # may be returned again by fetch_next_task on the next iteration —
            # confirm against the repository implementation.
            logger.warning(f"⚠️ Ukjent task-type {type(task)} for {task.taskId}, hopper over.")
            return poll_interval, poll_interval

        if not claim_task(db, str(task.taskId), worker_id):
            logger.info(f"⏩ Task {task.taskId} ble claimet av en annen worker.")
            return poll_interval, poll_interval

        logger.info(f"🔔 Fant task {task.taskId} ({task.task}), claimed by {worker_id}")

        try:
            event: MetadataSearchResultEvent = asyncio.run(process_task(db, task))
            if not event:
                raise RuntimeError("process_task returned nothing!")
            persist_event_and_mark_consumed(db, event, str(task.taskId))
            logger.info(f"✅ Task {task.taskId} ferdig prosessert")
        except Exception as task_error:
            # A failing task must not stop the worker: record the failure and
            # surface the error through the heartbeat.
            logger.error(f"❌ Task {task.taskId} feilet: {task_error}")
            mark_failed(db, str(task.taskId))
            heartbeat_ref(time.time(), in_backoff=False, error=str(task_error))

        # After a task -> reset the poll interval.
        return poll_interval, 5
    except Exception as e:
        logger.error(f"⚠️ Feil i worker: {e}")
        try:
            db.connect()
        except Exception as reconnect_error:
            # A failed reconnect must not escape and kill the worker loop;
            # the next iteration will fail again and retry the reconnect.
            logger.error(f"⚠️ Klarte ikke å koble til databasen på nytt: {reconnect_error}")
        heartbeat_ref(time.time(), in_backoff=True, error=str(e))
        return poll_interval, 5
def run_worker(db: Database, shutdown_flag_ref=lambda: False) -> None:
    """
    Run the poller loop until a shutdown is requested.

    A unique worker id is generated once, then ``run_iteration`` is called
    repeatedly; after each iteration the worker sleeps for the interval that
    the iteration returned.

    Args:
        db: Database handle passed to ``run_iteration``; it is closed when the
            loop ends, whether normally or through an exception.
        shutdown_flag_ref: Zero-argument callable checked before each
            iteration; the loop stops once it returns a truthy value. The
            default never requests shutdown.
    """
    poll_interval: int = 5
    worker_id = f"PyMetadata-{uuid.uuid4()}"
    try:
        while not shutdown_flag_ref():
            sleep_interval, poll_interval = run_iteration(db, worker_id, poll_interval)
            time.sleep(sleep_interval)
        logger.info("👋 run_worker loop avsluttet")
    finally:
        # Close the database even when the loop is interrupted (for example
        # KeyboardInterrupt during the sleep) or an iteration raises.
        db.close()