Migrate background tasks to Celery
This commit is contained in:
parent
efe3248c07
commit
93129333e6
7 changed files with 106 additions and 101 deletions
|
|
@ -1,4 +1,6 @@
|
|||
import asyncio
|
||||
import dataclasses
|
||||
import json
|
||||
import logging
|
||||
import logging.config
|
||||
from pathlib import Path
|
||||
|
|
@ -15,6 +17,7 @@ from api.worker import (
|
|||
task_queue,
|
||||
task_results,
|
||||
)
|
||||
from dotenv import load_dotenv
|
||||
from fastapi import Depends, FastAPI, HTTPException, Query
|
||||
from api.auth import User
|
||||
from models.listing import QueryParameters
|
||||
|
|
@ -22,11 +25,14 @@ from repositories.listing_repository import ListingRepository
|
|||
from repositories.listing_repository import ListingRepository
|
||||
from database import engine
|
||||
from fastapi.middleware.cors import CORSMiddleware
|
||||
|
||||
from tasks import listing_tasks
|
||||
from ui_exporter import export_immoweb
|
||||
from alembic import command
|
||||
from alembic.config import Config
|
||||
from contextlib import asynccontextmanager
|
||||
|
||||
load_dotenv()
|
||||
logger = logging.getLogger("uvicorn")
|
||||
|
||||
|
||||
|
|
@ -43,9 +49,6 @@ logger = logging.getLogger("uvicorn")
|
|||
# app = FastAPI(lifespan=lifespan)
|
||||
app = FastAPI()
|
||||
|
||||
# Start worker thread
|
||||
WorkerManager(DumpListingsWorker()).start()
|
||||
|
||||
|
||||
# Allow CORS (for React frontend)
|
||||
app.add_middleware(
|
||||
|
|
@ -81,19 +84,9 @@ async def refresh_listings(
|
|||
user: Annotated[User, Depends(get_current_user)],
|
||||
query_parameters: Annotated[QueryParameters, Query()],
|
||||
) -> dict[str, str]:
|
||||
# Submit processing task
|
||||
task_id = str(uuid.uuid4())
|
||||
task_results[task_id] = {"status": TaskStatus.QUEUED}
|
||||
try:
|
||||
task_queue.put_nowait(
|
||||
(task_id, query_parameters),
|
||||
)
|
||||
except queue.Full:
|
||||
raise HTTPException(
|
||||
status_code=429,
|
||||
detail="Already processing at maximum capacity. Please try again later",
|
||||
)
|
||||
return {"task_id": task_id}
|
||||
# TODO: rate limit
|
||||
task = listing_tasks.dump_listings_task.delay(query_parameters.json())
|
||||
return {"task_id": task.id}
|
||||
|
||||
|
||||
@app.get("/api/task_status")
|
||||
|
|
@ -101,6 +94,9 @@ async def get_task_status(
|
|||
user: Annotated[User, Depends(get_current_user)],
|
||||
task_id: str,
|
||||
) -> dict[str, str]:
|
||||
if task_id not in task_results:
|
||||
return {"status": "not_found"}
|
||||
return task_results[task_id]
|
||||
task_result = listing_tasks.dump_listings_task.AsyncResult(task_id)
|
||||
return {
|
||||
"task_id": task_id,
|
||||
"status": task_result.status,
|
||||
"result": json.dumps(task_result.result),
|
||||
}
|
||||
|
|
|
|||
|
|
@ -1,79 +0,0 @@
|
|||
from __future__ import annotations

import asyncio
import atexit
import enum
import importlib
import queue
from abc import ABC, abstractmethod
from pathlib import Path
from queue import Queue
from threading import Thread

from database import engine
from repositories.listing_repository import ListingRepository
|
||||
|
||||
# The module name starts with a digit, so it cannot be named in a regular
# ``import`` statement and is loaded by string instead.
dump_listings_module = importlib.import_module("1_dump_listings")

# In-memory task queue and results store.
# maxsize=1: disallow multiple in-flight requests for now.
task_queue: Queue = Queue(maxsize=1)
# Maps a task id to a dict carrying at least a "status" entry.
task_results: dict = {}
|
||||
|
||||
|
||||
class WorkerManager:
    """Run a worker's ``run()`` coroutine on a background daemon thread.

    The manager registers an ``atexit`` hook at construction time so the
    worker is asked to stop when the interpreter shuts down.
    """

    def __init__(self, worker: "WorkerThread"):
        """Store *worker* and register the shutdown hook.

        Args:
            worker: Object exposing async ``run()`` and ``stop()`` methods.
        """
        self._worker = worker
        # No thread exists until start() is called; stop() checks for this so
        # that stopping a never-started manager does not raise AttributeError.
        self._worker_thread = None
        # Register a plain callable so the stop() coroutine is only created
        # when the hook actually fires, not eagerly at construction time.
        atexit.register(self._stop_at_exit)

    def _stop_at_exit(self) -> None:
        """Drive ``stop()`` to completion from the synchronous atexit hook."""
        asyncio.run(self.stop())

    async def stop(self) -> None:
        """Ask the worker to stop, then wait for its thread to finish.

        Safe to call before ``start()``: in that case only the worker's own
        ``stop()`` is awaited. The join is unbounded, so this blocks until the
        worker's ``run()`` coroutine returns.
        """
        await self._worker.stop()
        worker_thread = self._worker_thread
        if worker_thread is not None:
            worker_thread.join()

    def start(self):
        """Start a daemon thread that runs the worker's ``run()`` coroutine."""
        self._worker_thread = Thread(
            target=asyncio.run, args=(self._worker.run(),), daemon=True
        )
        self._worker_thread.start()
|
||||
|
||||
|
||||
class WorkerThread(ABC):
    """Interface for workers driven by ``WorkerManager``.

    Deriving from ``ABC`` makes the ``@abstractmethod`` markers effective:
    the base class, and any subclass that omits ``stop`` or ``run``, cannot
    be instantiated.
    """

    @abstractmethod
    async def stop(self) -> None:
        """Request that ``run()`` finishes."""
        ...

    @abstractmethod
    async def run(self) -> None:
        """Execute the worker's main loop."""
        ...
|
||||
|
||||
|
||||
class DumpListingsWorker(WorkerThread):
    """Worker that takes jobs from ``task_queue`` and dumps listings.

    Each job is a ``(task_id, task_data)`` tuple. Progress and outcome are
    written to the module-level ``task_results`` dict under ``task_id``.
    """

    # Set to True by stop(); checked at the top of every loop iteration.
    should_stop = False
    # Seconds to wait for a job before re-checking ``should_stop``. Without a
    # timeout the queue read blocks forever and a stop request is never seen
    # while the worker is idle.
    poll_interval_seconds = 1.0

    async def stop(self) -> None:
        """Ask ``run()`` to exit at its next loop check."""
        self.should_stop = True

    async def run(self) -> None:
        """Process queued tasks until a stop is requested.

        Updates the global ``task_results`` with PROCESSING, then with either
        COMPLETED plus a result message or FAILED plus the error text.
        """
        repository = ListingRepository(engine)
        data_dir_path = Path("data/rs")
        while not self.should_stop:
            try:
                task_id, task_data = task_queue.get(
                    timeout=self.poll_interval_seconds
                )
            except queue.Empty:
                # Nothing queued; loop round to re-check should_stop.
                continue
            task_results[task_id] = {"status": TaskStatus.PROCESSING}
            try:
                new_listings = await dump_listings_module.dump_listings_full(
                    task_data, repository, data_dir_path
                )
                task_results[task_id] = {
                    "status": TaskStatus.COMPLETED,
                    "result": f"Fetched {len(new_listings)} new listings for query {task_data}",
                }
            except Exception as e:
                # Loop boundary: record the failure for the status endpoint
                # rather than letting one bad task kill the worker thread.
                task_results[task_id] = {"status": TaskStatus.FAILED, "error": str(e)}
            finally:
                # Always balance the get() so the queue's unfinished-task
                # count stays correct.
                task_queue.task_done()
|
||||
|
||||
|
||||
class TaskStatus(enum.StrEnum):
|
||||
QUEUED = "queued"
|
||||
PROCESSING = "processing"
|
||||
COMPLETED = "completed"
|
||||
FAILED = "failed"
|
||||
Loading…
Add table
Add a link
Reference in a new issue