Improve efficiency of process missing rows task

For every missing row this was: - downloading the CSV file from S3 - looping through every row in it until it found the one matching the index of the missing row `RecipientCSV` implements `__getitem__`[1] (which maybe it didn’t before) so we can create it once, then index the relevant row directly. *** 1. 5ae0572d41/notifications_utils/recipients.py (L78-L79)
2026-02-01 15:46:07 -05:00 · 2020-09-26 10:57:21 +01:00
parent 2af62bdd1f
commit 9ad33045dd
1 changed files with 5 additions and 6 deletions
--- a/app/celery/scheduled_tasks.py
+++ b/app/celery/scheduled_tasks.py
@@ -237,14 +237,13 @@ def check_for_missing_rows_in_completed_jobs():
    jobs_and_job_size = find_jobs_with_missing_rows()
    for x in jobs_and_job_size:
        job = x[1]
+        recipient_csv, template, sender_id = get_recipient_csv_and_template_and_sender_id(job)
        missing_rows = find_missing_row_for_job(job.id, job.notification_count)
        for row_to_process in missing_rows:
-            recipient_csv, template, sender_id = get_recipient_csv_and_template_and_sender_id(job)
-            for row in recipient_csv.get_rows():
-                if row.index == row_to_process.missing_row:
-                    current_app.logger.info(
-                        "Processing missing row: {} for job: {}".format(row_to_process.missing_row, job.id))
-                    process_row(row, template, job, job.service, sender_id=sender_id)
+            row = recipient_csv[row_to_process.missing_row]
+            current_app.logger.info(
+                "Processing missing row: {} for job: {}".format(row_to_process.missing_row, job.id))
+            process_row(row, template, job, job.service, sender_id=sender_id)


@notify_celery.task(name='check-for-services-with-high-failure-rates-or-sending-to-tv-numbers')