Skip to content

Commit

Permalink
Merge branch 'develop' into 3328-vul-audit
Browse files Browse the repository at this point in the history
  • Loading branch information
raftmsohani authored Jan 8, 2025
2 parents 9f39404 + d326e59 commit cde7eb3
Show file tree
Hide file tree
Showing 2 changed files with 61 additions and 21 deletions.
76 changes: 57 additions & 19 deletions tdrs-backend/tdpservice/data_files/util.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@ class ParserErrorCategoryChoices(models.TextChoices):
HISTORICAL_CONSISTENCY = "6", _("Historical consistency")


def get_prioritized_queryset(parser_errors):
def get_prioritized_queryset(parser_errors, is_s3_s4):
"""Generate a prioritized queryset of ParserErrors."""
PRIORITIZED_CAT2 = (
("FAMILY_AFFILIATION", "CITIZENSHIP_STATUS", "CLOSURE_REASON"),
Expand All @@ -42,6 +42,15 @@ def get_prioritized_queryset(parser_errors):
Q(error_type=ParserErrorCategoryChoices.CASE_CONSISTENCY)
filtered_errors = parser_errors.filter(error_type_query)

# If we are a Aggregate or Stratum file, we want all cat2 and cat3 errors.
if is_s3_s4:
all_cat2_cat3 = Q(error_type=ParserErrorCategoryChoices.FIELD_VALUE) | \
Q(error_type=ParserErrorCategoryChoices.VALUE_CONSISTENCY)
filtered_errors = filtered_errors.union(parser_errors.filter(all_cat2_cat3).exclude(
error_message__contains="HEADER Update Indicator")
)
return filtered_errors

for fields in PRIORITIZED_CAT2:
filtered_errors = filtered_errors.union(parser_errors.filter(
field_name__in=fields,
Expand Down Expand Up @@ -121,36 +130,65 @@ def format_header(header_list: list):
return ' '.join([i.capitalize() for i in header_list.split('_')])


def write_prioritized_errors(worksheet, prioritized_errors, bold):
"""Write prioritized errors to spreadsheet."""
row, col = 5, 0

# We will write the headers in the first row
def active_closed_generator(record, rpt_month_year, fields_json):
"""Generate error report row for S1/S2 files."""
return (record.case_number,
rpt_month_year[:4],
calendar.month_name[int(rpt_month_year[4:])] if rpt_month_year[4:] else None,
format_error_msg(record.error_message, fields_json),
record.item_number,
friendly_names(fields_json),
internal_names(fields_json),
record.row_number,
str(ParserErrorCategoryChoices(record.error_type).label))


def aggregate_stratum_generator(record, rpt_month_year, fields_json):
"""Generate error report row for S3/S4 files."""
return (rpt_month_year[:4],
calendar.month_name[int(rpt_month_year[4:])] if rpt_month_year[4:] else None,
format_error_msg(record.error_message, fields_json),
record.item_number,
friendly_names(fields_json),
internal_names(fields_json),
record.row_number,
str(ParserErrorCategoryChoices(record.error_type).label))


def get_row_generator(is_s3_s4):
"""Get the correct row generator."""
if is_s3_s4:
return aggregate_stratum_generator
return active_closed_generator


def get_sheet_columns(is_s3_s4):
"""Get the correct columns based on file section."""
columns = ['case_number', 'year', 'month',
'error_message', 'item_number', 'item_name',
'internal_variable_name', 'row_number', 'error_type',
]
columns = columns[1:] if is_s3_s4 else columns
return columns


def write_prioritized_errors(worksheet, prioritized_errors, bold, is_s3_s4):
"""Write prioritized errors to spreadsheet."""
# We will write the headers in the first row, remove case_number if we are s3/s4
columns = get_sheet_columns(is_s3_s4)
for idx, col in enumerate(columns):
worksheet.write(row, idx, format_header(col), bold)
worksheet.write(5, idx, format_header(col), bold)

row_generator = get_row_generator(is_s3_s4)
paginator = Paginator(prioritized_errors.order_by('pk'), settings.BULK_CREATE_BATCH_SIZE)
row_idx = 6
for page in paginator:
for record in page.object_list:
rpt_month_year = getattr(record, 'rpt_month_year', None)
rpt_month_year = str(rpt_month_year) if rpt_month_year else ""

fields_json = check_fields_json(getattr(record, 'fields_json', {}), record.field_name)

worksheet.write(row_idx, 0, record.case_number)
worksheet.write(row_idx, 1, rpt_month_year[:4])
worksheet.write(row_idx, 2, calendar.month_name[int(rpt_month_year[4:])] if rpt_month_year[4:] else None)
worksheet.write(row_idx, 3, format_error_msg(record.error_message, fields_json))
worksheet.write(row_idx, 4, record.item_number)
worksheet.write(row_idx, 5, friendly_names(fields_json))
worksheet.write(row_idx, 6, internal_names(fields_json))
worksheet.write(row_idx, 7, record.row_number)
worksheet.write(row_idx, 8, str(ParserErrorCategoryChoices(record.error_type).label))
worksheet.write_row(row_idx, 0, row_generator(record, rpt_month_year, fields_json))
row_idx += 1


Expand Down Expand Up @@ -189,7 +227,7 @@ def write_aggregate_errors(worksheet, all_errors, bold):
row_idx += 1


def get_xls_serialized_file(all_errors, prioritized_errors):
def get_xls_serialized_file(all_errors, prioritized_errors, is_s3_s4):
"""Return xls file created from the error."""
output = BytesIO()
workbook = xlsxwriter.Workbook(output)
Expand All @@ -200,7 +238,7 @@ def get_xls_serialized_file(all_errors, prioritized_errors):
write_worksheet_banner(aggregate_sheet)

bold = workbook.add_format({'bold': True})
write_prioritized_errors(prioritized_sheet, prioritized_errors, bold)
write_prioritized_errors(prioritized_sheet, prioritized_errors, bold, is_s3_s4)
write_aggregate_errors(aggregate_sheet, all_errors, bold)

# autofit all columns except for the first one
Expand Down
6 changes: 4 additions & 2 deletions tdrs-backend/tdpservice/data_files/views.py
Original file line number Diff line number Diff line change
Expand Up @@ -147,9 +147,11 @@ def download_error_report(self, request, pk=None):
"""Generate and return the parsing error report xlsx."""
datafile = self.get_object()
all_errors = ParserError.objects.filter(file=datafile)
filtered_errors = get_prioritized_queryset(all_errors)
is_s3_s4 = (DataFile.Section.AGGREGATE_DATA in datafile.section or
DataFile.Section.STRATUM_DATA in datafile.section)
filtered_errors = get_prioritized_queryset(all_errors, is_s3_s4)

return Response(get_xls_serialized_file(all_errors, filtered_errors))
return Response(get_xls_serialized_file(all_errors, filtered_errors, is_s3_s4))


class GetYearList(APIView):
Expand Down

0 comments on commit cde7eb3

Please sign in to comment.