Files
notifications-api/app/celery/reporting_tasks.py
Kenneth Kehl 8fa893895c cleanup
2025-07-10 14:29:46 -07:00

121 lines
4.4 KiB
Python

from datetime import datetime, timedelta
from flask import current_app
from app import notify_celery
from app.config import QueueNames
from app.dao.fact_billing_dao import fetch_billing_data_for_day, update_fact_billing
from app.dao.fact_notification_status_dao import update_fact_notification_status
from app.dao.notifications_dao import get_service_ids_with_notifications_on_date
from app.enums import NotificationType
from app.utils import utc_now
@notify_celery.task(name="create-nightly-billing")
def create_nightly_billing(day_start=None):
# day_start is a datetime.date() object. e.g.
# up to 4 days of data counting back from day_start is consolidated
if day_start is None:
day_start = utc_now().date() - timedelta(days=1)
else:
# When calling the task its a string in the format of "YYYY-MM-DD"
day_start = datetime.strptime(day_start, "%Y-%m-%d").date()
for i in range(0, 10):
process_day = (day_start - timedelta(days=i)).isoformat()
create_nightly_billing_for_day.apply_async(
kwargs={"process_day": process_day}, queue=QueueNames.REPORTING
)
current_app.logger.info(
f"create-nightly-billing task: create-nightly-billing-for-day task created for {process_day}"
)
@notify_celery.task(name="create-nightly-billing-for-day")
def create_nightly_billing_for_day(process_day):
process_day = datetime.strptime(process_day, "%Y-%m-%d").date()
current_app.logger.info(
f"create-nightly-billing-for-day task for {process_day}: started"
)
start = utc_now()
transit_data = fetch_billing_data_for_day(process_day=process_day)
end = utc_now()
current_app.logger.info(
f"create-nightly-billing-for-day task for {process_day}: data fetched in {(end - start).seconds} seconds"
)
for data in transit_data:
update_fact_billing(data, process_day)
current_app.logger.info(
f"create-nightly-billing-for-day task for {process_day}: "
f"task complete. {len(transit_data)} rows updated"
)
@notify_celery.task(name="create-nightly-notification-status")
def create_nightly_notification_status():
"""
Aggregate notification statuses into rows in ft_notification_status.
In order to minimise effort, this task assumes that:
- Email + SMS statuses don't change after 3 days. This is currently true
because all outstanding email / SMS are "timed out" after 3 days, and
we reject delivery receipts after this point.
Because the time range of the task exceeds the minimum possible retention
period (3 days), we need to choose which table to query for each service.
The aggregation happens for 1 extra day in case:
- This task or the "timeout" task fails to run.
- Data is (somehow) still in transit to the history table, which would
mean the aggregated results are temporarily incorrect.
"""
yesterday = utc_now().date() - timedelta(days=1)
for notification_type in (NotificationType.SMS, NotificationType.EMAIL):
days = 4
for i in range(days):
process_day = yesterday - timedelta(days=i)
relevant_service_ids = get_service_ids_with_notifications_on_date(
notification_type, process_day
)
for service_id in relevant_service_ids:
create_nightly_notification_status_for_service_and_day.apply_async(
kwargs={
"process_day": process_day.isoformat(),
"notification_type": notification_type,
"service_id": service_id,
},
queue=QueueNames.REPORTING,
)
@notify_celery.task(name="create-nightly-notification-status-for-service-and-day")
def create_nightly_notification_status_for_service_and_day(
process_day, service_id, notification_type
):
process_day = datetime.strptime(process_day, "%Y-%m-%d").date()
start = utc_now()
update_fact_notification_status(
process_day=process_day,
notification_type=notification_type,
service_id=service_id,
)
end = utc_now()
current_app.logger.info(
f"create-nightly-notification-status-for-service-and-day task update "
f"for {service_id}, {notification_type} for {process_day}: "
f"updated in {(end - start).seconds} seconds"
)