mirror of
https://github.com/GSA/notifications-api.git
synced 2026-02-02 17:31:14 -05:00
Group letters into zip files with a maximum number of letters each for sending to DVLA
Capping the number of letters per zip file is necessary because the SQS task, which carries the list of filenames to zip, needs to stay under a certain size. We also compress the task message (zlib) when sending.
This commit is contained in:
@@ -98,7 +98,8 @@ def collate_letter_pdfs_for_day(date):
|
|||||||
notify_celery.send_task(
|
notify_celery.send_task(
|
||||||
name=TaskNames.ZIP_AND_SEND_LETTER_PDFS,
|
name=TaskNames.ZIP_AND_SEND_LETTER_PDFS,
|
||||||
kwargs={'filenames_to_zip': filenames},
|
kwargs={'filenames_to_zip': filenames},
|
||||||
queue=QueueNames.PROCESS_FTP
|
queue=QueueNames.PROCESS_FTP,
|
||||||
|
compression='zlib'
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
@@ -112,7 +113,10 @@ def group_letters(letter_pdfs):
|
|||||||
list_of_files = []
|
list_of_files = []
|
||||||
for letter in letter_pdfs:
|
for letter in letter_pdfs:
|
||||||
if letter['Key'].lower().endswith('.pdf'):
|
if letter['Key'].lower().endswith('.pdf'):
|
||||||
if running_filesize + letter['Size'] > current_app.config['MAX_LETTER_PDF_ZIP_FILESIZE']:
|
if (
|
||||||
|
running_filesize + letter['Size'] > current_app.config['MAX_LETTER_PDF_ZIP_FILESIZE'] or
|
||||||
|
len(list_of_files) >= current_app.config['MAX_LETTER_PDF_COUNT_PER_ZIP']
|
||||||
|
):
|
||||||
yield list_of_files
|
yield list_of_files
|
||||||
running_filesize = 0
|
running_filesize = 0
|
||||||
list_of_files = []
|
list_of_files = []
|
||||||
|
|||||||
@@ -129,6 +129,7 @@ class Config(object):
|
|||||||
MAX_VERIFY_CODE_COUNT = 10
|
MAX_VERIFY_CODE_COUNT = 10
|
||||||
|
|
||||||
MAX_LETTER_PDF_ZIP_FILESIZE = 500 * 1024 * 1024 # 500mb
|
MAX_LETTER_PDF_ZIP_FILESIZE = 500 * 1024 * 1024 # 500mb
|
||||||
|
MAX_LETTER_PDF_COUNT_PER_ZIP = 5000
|
||||||
|
|
||||||
CHECK_PROXY_HEADER = False
|
CHECK_PROXY_HEADER = False
|
||||||
|
|
||||||
|
|||||||
@@ -155,16 +155,18 @@ def test_collate_letter_pdfs_for_day(notify_api, mocker):
|
|||||||
assert mock_celery.call_args_list[0] == call(
|
assert mock_celery.call_args_list[0] == call(
|
||||||
name='zip-and-send-letter-pdfs',
|
name='zip-and-send-letter-pdfs',
|
||||||
kwargs={'filenames_to_zip': ['A.PDF', 'B.pDf']},
|
kwargs={'filenames_to_zip': ['A.PDF', 'B.pDf']},
|
||||||
queue='process-ftp-tasks'
|
queue='process-ftp-tasks',
|
||||||
|
compression='zlib'
|
||||||
)
|
)
|
||||||
assert mock_celery.call_args_list[1] == call(
|
assert mock_celery.call_args_list[1] == call(
|
||||||
name='zip-and-send-letter-pdfs',
|
name='zip-and-send-letter-pdfs',
|
||||||
kwargs={'filenames_to_zip': ['C.pdf']},
|
kwargs={'filenames_to_zip': ['C.pdf']},
|
||||||
queue='process-ftp-tasks'
|
queue='process-ftp-tasks',
|
||||||
|
compression='zlib'
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
def test_group_letters(notify_api):
|
def test_group_letters_splits_on_file_size(notify_api):
|
||||||
letters = [
|
letters = [
|
||||||
# ends under max but next one is too big
|
# ends under max but next one is too big
|
||||||
{'Key': 'A.pdf', 'Size': 1}, {'Key': 'B.pdf', 'Size': 2},
|
{'Key': 'A.pdf', 'Size': 1}, {'Key': 'B.pdf', 'Size': 2},
|
||||||
@@ -190,6 +192,29 @@ def test_group_letters(notify_api):
|
|||||||
assert next(x, None) is None
|
assert next(x, None) is None
|
||||||
|
|
||||||
|
|
||||||
|
def test_group_letters_splits_on_file_count(notify_api):
|
||||||
|
letters = [
|
||||||
|
{'Key': 'A.pdf', 'Size': 1},
|
||||||
|
{'Key': 'B.pdf', 'Size': 2},
|
||||||
|
{'Key': 'C.pdf', 'Size': 3},
|
||||||
|
{'Key': 'D.pdf', 'Size': 1},
|
||||||
|
{'Key': 'E.pdf', 'Size': 1},
|
||||||
|
{'Key': 'F.pdf', 'Size': 5},
|
||||||
|
{'Key': 'G.pdf', 'Size': 6},
|
||||||
|
{'Key': 'H.pdf', 'Size': 1},
|
||||||
|
{'Key': 'I.pdf', 'Size': 1},
|
||||||
|
]
|
||||||
|
|
||||||
|
with set_config_values(notify_api, {'MAX_LETTER_PDF_COUNT_PER_ZIP': 3}):
|
||||||
|
x = group_letters(letters)
|
||||||
|
|
||||||
|
assert next(x) == [{'Key': 'A.pdf', 'Size': 1}, {'Key': 'B.pdf', 'Size': 2}, {'Key': 'C.pdf', 'Size': 3}]
|
||||||
|
assert next(x) == [{'Key': 'D.pdf', 'Size': 1}, {'Key': 'E.pdf', 'Size': 1}, {'Key': 'F.pdf', 'Size': 5}]
|
||||||
|
assert next(x) == [{'Key': 'G.pdf', 'Size': 6}, {'Key': 'H.pdf', 'Size': 1}, {'Key': 'I.pdf', 'Size': 1}]
|
||||||
|
# make sure iterator is exhausted
|
||||||
|
assert next(x, None) is None
|
||||||
|
|
||||||
|
|
||||||
def test_group_letters_ignores_non_pdfs(notify_api):
|
def test_group_letters_ignores_non_pdfs(notify_api):
|
||||||
letters = [{'Key': 'A.zip'}]
|
letters = [{'Key': 'A.zip'}]
|
||||||
assert list(group_letters(letters)) == []
|
assert list(group_letters(letters)) == []
|
||||||
|
|||||||
Reference in New Issue
Block a user