Revert running status aggregation in parallel

The top-level task didn't run successfully after this was deployed due to the worker being killed due to heavy disk usage. While the more parallel version does log much more, it doesn't totally explain the disk behaviour. Nonetheless, reverting it is sensible to give us the time we need to investigate more.
2026-01-31 15:15:38 -05:00 · 2022-01-20 10:39:23 +00:00
parent 0a88724ff5
commit 0f6dea0deb
3 changed files with 44 additions and 45 deletions
--- a/app/celery/reporting_tasks.py
+++ b/app/celery/reporting_tasks.py
@@ -3,7 +3,7 @@ from datetime import datetime, timedelta
 from flask import current_app
 from notifications_utils.timezones import convert_utc_to_bst

-from app import db, notify_celery
+from app import notify_celery
 from app.config import QueueNames
 from app.cronitor import cronitor
 from app.dao.fact_billing_dao import (
@@ -91,46 +91,47 @@ def create_nightly_notification_status():

    yesterday = convert_utc_to_bst(datetime.utcnow()).date() - timedelta(days=1)

-    for (service_id,) in db.session.query(Service.id):
-        for notification_type in [SMS_TYPE, EMAIL_TYPE, LETTER_TYPE]:
-            days = 10 if notification_type == LETTER_TYPE else 4
+    for notification_type in [SMS_TYPE, EMAIL_TYPE, LETTER_TYPE]:
+        days = 10 if notification_type == LETTER_TYPE else 4

-            for i in range(days):
-                process_day = yesterday - timedelta(days=i)
+        for i in range(days):
+            process_day = yesterday - timedelta(days=i)

-                create_nightly_notification_status_for_service_and_day.apply_async(
-                    kwargs={
-                        'process_day': process_day.isoformat(),
-                        'notification_type': notification_type,
-                        'service_id': service_id,
-                    },
-                    queue=QueueNames.REPORTING
-                )
-                current_app.logger.info(
-                    f"create-nightly-notification-status-for-day task created "
-                    f"for {service_id}, {notification_type} and {process_day}"
-                )
+            create_nightly_notification_status_for_day.apply_async(
+                kwargs={
+                    'process_day': process_day.isoformat(),
+                    'notification_type': notification_type,
+                },
+                queue=QueueNames.REPORTING
+            )
+            current_app.logger.info(
+                f"create-nightly-notification-status-for-day task created "
+                f"for {notification_type} and {process_day}"
+            )


-@notify_celery.task(name="create-nightly-notification-status-for-service-and-day")
-def create_nightly_notification_status_for_service_and_day(process_day, service_id, notification_type):
+@notify_celery.task(name="create-nightly-notification-status-for-day")
+def create_nightly_notification_status_for_day(process_day, notification_type):
    process_day = datetime.strptime(process_day, "%Y-%m-%d").date()
    current_app.logger.info(
        f'create-nightly-notification-status-for-day task started '
-        f'for {service_id}, {notification_type} for {process_day}'
+        f'for {notification_type} for {process_day}'
    )

    start = datetime.utcnow()
-    new_status_rows = fetch_status_data_for_service_and_day(
-        process_day=process_day,
-        notification_type=notification_type,
-        service_id=service_id,
-    )
+    new_status_rows = []
+
+    for service in Service.query.all():
+        new_status_rows += fetch_status_data_for_service_and_day(
+            process_day=process_day,
+            notification_type=notification_type,
+            service_id=service.id,
+        )

    end = datetime.utcnow()
    current_app.logger.info(
        f'create-nightly-notification-status-for-day task fetch '
-        f'for {service_id}, {notification_type} for {process_day}: '
+        f'for {notification_type} for {process_day}: '
        f'data fetched in {(end - start).seconds} seconds'
    )

@@ -138,11 +139,10 @@ def create_nightly_notification_status_for_service_and_day(process_day, service_
        new_status_rows=new_status_rows,
        process_day=process_day,
        notification_type=notification_type,
-        service_id=service_id
    )

    current_app.logger.info(
        f'create-nightly-notification-status-for-day task finished '
-        f'for {service_id}, {notification_type} for {process_day}: '
+        f'for {notification_type} for {process_day}: '
        f'{len(new_status_rows)} rows updated'
    )