Refactor

2025-07-21 18:25:58 +02:00 · 2024-06-07 14:26:04 -06:00 · 2024-06-07 14:26:04 -06:00 · 34a9497372
commit 34a9497372
parent cafce7c54b
2 changed files with 187 additions and 197 deletions
--- a/src/registrar/models/utility/generic_helper.py
+++ b/src/registrar/models/utility/generic_helper.py
@ -298,3 +298,27 @@ def replace_url_queryparams(url_to_modify: str, query_params, convert_list_to_cs
    new_url = urlunparse(url_parts)
    return new_url
@staticmethod
 def convert_queryset_to_dict(queryset, is_model=True, key="id"):
    """
    Transforms a queryset into a dictionary keyed by a specified key (like "id").
    Parameters:
        requests (QuerySet or list of dicts): Input data.
        is_model (bool): Indicates if each item in 'queryset' are model instances (True) or dictionaries (False).
        key (str): Key or attribute to use for the resulting dictionary's keys.
    Returns:
        dict: Dictionary with keys derived from 'key' and values corresponding to items in 'queryset'.
    """
    if is_model:
        request_dict = {getattr(value, key): value for value in queryset}
    else:
        # Querysets sometimes contain sets of dictionaries.
        # Calling .values is an example of this.
        request_dict = {value[key]: value for value in queryset}
    return request_dict
--- a/src/registrar/utility/csv_export.py
+++ b/src/registrar/utility/csv_export.py
@ -14,6 +14,7 @@ from django.utils import timezone
 from django.core.paginator import Paginator
 from django.db.models.functions import Concat, Coalesce
 from django.contrib.postgres.aggregates import StringAgg
 from registrar.models.utility.generic_helper import convert_queryset_to_dict
 from registrar.templatetags.custom_filters import get_region
 from registrar.utility.enums import DefaultEmail
@ -713,6 +714,9 @@ class DomainRequestExport:
    Purely organizational -- all functions are independent.
    """
    # Get all the field names of the DomainRequest object
    domain_request_fields = set(field.name for field in DomainRequest._meta.get_fields())
    all_columns = [
        "Domain request",
        "Submitted at",
@ -743,111 +747,8 @@ class DomainRequestExport:
        "Investigator",
    ]
-    @staticmethod
+    @classmethod
-    def write_csv_for_requests(
+    def export_data_requests_growth_to_csv(cls, csv_file, start_date, end_date):
        writer,
        columns,
        requests,
        requests_with_extra_fields=None,
        should_write_header=True,
    ):
        """Receives params from the parent methods and outputs a CSV with filtered and sorted requests.
        Works with write_header as long as the same writer object is passed."""
        # Reduce the memory overhead when performing the write operation
        paginator = Paginator(requests, 1000)
        total_body_rows = []
        for page_num in paginator.page_range:
            page = paginator.page(page_num)
            rows = []
            for request in page.object_list:
                try:
                    extra = requests_with_extra_fields.get(request.id) if requests_with_extra_fields else {}
                    row = DomainRequestExport.parse_row_for_requests(columns, request, extra)
                    rows.append(row)
                except ValueError as err:
                    logger.error(f"csv_export -> Error when parsing row: {err}")
                    continue
            total_body_rows.extend(rows)
        if should_write_header:
            write_header(writer, columns)
        writer.writerows(total_body_rows)
    @staticmethod
    def parse_row_for_requests(columns, request: DomainRequest, extra_fields: dict):
        """
        Given a set of columns and a request dictionary,
        generate a new row from cleaned column data
        """
        # Handle the domain_type field. Defaults to the wrong format.
        org_type = request.organization_type
        if org_type and extra_fields.get("domain_type") is None:
            readable_org_type = DomainRequest.OrganizationChoices.get_org_label(org_type)
            extra_fields["domain_type"] = readable_org_type
        # Handle the federal_type field. Defaults to the wrong format.
        federal_type = request.federal_type
        if federal_type and extra_fields.get("human_readable_federal_type") is None:
            extra_fields["human_readable_federal_type"] = DomainRequest.BranchChoices.get_branch_label(federal_type)
        # Handle the status field. Defaults to the wrong format.
        status = request.status
        if status and extra_fields.get("status_display") is None:
            extra_fields["status_display"] = DomainRequest.DomainRequestStatus.get_status_label(status)
        # Handle the region field.
        state_territory = request.state_territory
        if state_territory and extra_fields.get("region") is None:
            extra_fields["region"] = get_region(state_territory)
        human_readable_election_board = "N/A"
        if request.is_election_board is not None:
            human_readable_election_board = "Yes" if request.is_election_board else "No"
        requested_domain = request.requested_domain
        if extra_fields.get("requested_domain_name") is None:
            extra_fields["requested_domain_name"] = getattr(requested_domain, "name", "No requested domain")
        # create a dictionary of fields which can be included in output.
        # "extra_fields" are precomputed fields (generated in the DB or parsed).
        FIELDS = {
            "Domain request": extra_fields.get("requested_domain_name"),
            "Status": extra_fields.get("status_display"),
            "Domain type": extra_fields.get("domain_type"),
            "Federal type": extra_fields.get("human_readable_federal_type"),
            "Region": extra_fields.get("region"),
            "Creator approved domains count": extra_fields.get("creator_approved_domains_count", 0),
            "Creator active requests count": extra_fields.get("creator_active_requests_count", 0),
            "Alternative domains": extra_fields.get("all_alternative_domains"),
            "Request additional details": extra_fields.get("additional_details"),
            "Other contacts": extra_fields.get("all_other_contacts"),
            "Current websites": extra_fields.get("all_current_websites"),
            # Normal fields
            "Federal agency": request.federal_agency.agency if request.federal_agency else None,
            "AO first name": request.authorizing_official.first_name,
            "AO last name": request.authorizing_official.last_name,
            "AO email": request.authorizing_official.email,
            "AO title/role": request.authorizing_official.title,
            "Creator first name": request.creator.first_name,
            "Creator last name": request.creator.last_name,
            "Creator email": request.creator.email,
            "Organization name": request.organization_name,
            "Election office": human_readable_election_board,
            "City": request.city,
            "State/territory": request.state_territory,
            "Request purpose": request.purpose,
            "CISA regional representative": request.cisa_representative_email,
            "Investigator": request.investigator.email if request.investigator else None,
            "Submitted at": request.submission_date,
        }
        row = [FIELDS.get(column, "") for column in columns]
        return row
    @staticmethod
    def export_data_requests_growth_to_csv(csv_file, start_date, end_date):
        """
        Growth report:
        Receive start and end dates from the view, parse them.
@ -876,33 +777,27 @@ class DomainRequestExport:
        all_requests = DomainRequest.objects.filter(**filter_condition).order_by(*sort_fields).distinct()
-        # Convert the request to a querystring. Only grab what we need.
+        annotated_requests = cls.annotate_and_retrieve_fields(all_requests, {"requested_domain__name"})
-        values_to_return = ["id", "generic_org_type", "federal_type", "submission_date"]
+        requests_dict = convert_queryset_to_dict(annotated_requests, is_model=False)
        extra_values = DomainRequestExport.annotate_request_and_return_values(all_requests, {}, values_to_return)
        # Override the default value for domain_type
        for request in extra_values.values():
            # Handle the domain_type field. Defaults to the wrong variant.
            org_type = request.get("generic_org_type")
            federal_type = request.get("federal_type")
            request["domain_type"] = None
            if org_type:
                readable_org_type = DomainRequest.OrganizationChoices.get_org_label(org_type)
                if federal_type:
                    readable_federal_type = DomainRequest.BranchChoices.get_branch_label(federal_type)
                    request["domain_type"] = f"{readable_org_type} - {readable_federal_type}"
                else:
                    request["domain_type"] = readable_org_type
        DomainRequestExport.write_csv_for_requests(writer, columns, all_requests, extra_values, should_write_header=True)
        cls.write_csv_for_requests(writer, columns, requests_dict)
    @classmethod
    def export_full_domain_request_report(cls, csv_file):
        writer = csv.writer(csv_file)
        requests = (
            DomainRequest.objects.select_related(
                "creator", "authorizing_official", "federal_agency", "investigator", "requested_domain"
            )
            .prefetch_related("current_websites", "other_contacts", "alternative_domains")
            .exclude(status__in=[DomainRequest.DomainRequestStatus.STARTED])
            .order_by("status","requested_domain__name",)
            .distinct()
        )
        # Annotations are custom columns returned to the queryset (AKA: computed in the DB)
        annotations = {
            "additional_details": DomainRequestExport.get_additional_details_query(),
            "creator_approved_domains_count": DomainRequestExport.get_creator_approved_domains_count_query(),
            "creator_active_requests_count": DomainRequestExport.get_creator_active_requests_count_query(),
            "all_other_contacts": DomainRequestExport.get_all_other_contacts_query(),
@ -910,95 +805,166 @@ class DomainRequestExport:
            "all_alternative_domains": StringAgg("alternative_domains__website", delimiter=" | ", distinct=True),
        }
-        values_to_return = [
+        # .values can't go two levels deep (just returns the id) - so we have to include this.
-            # Return out custom fields
+        additional_values = [
-            "all_alternative_domains",
+            "requested_domain__name",
-            "all_other_contacts",
+            "federal_agency__agency",
-            "all_current_websites",
+            "authorizing_official__first_name",
-            "additional_details",
+            "authorizing_official__last_name",
-            "creator_approved_domains_count",
+            "authorizing_official__email",
-            "creator_active_requests_count",
+            "authorizing_official__title",
            "creator__first_name",
            "creator__last_name",
            "creator__email",
            "investigator__email"
        ]
-        requests = (
+        # Convert the domain request queryset to a dictionary (including annotated fields)
-            DomainRequest.objects.select_related(
+        annotated_requests = cls.annotate_and_retrieve_fields(requests, annotations, additional_values)
-                "creator", "authorizing_official", "federal_agency", "investigator", "requested_domain"
+        requests_dict = convert_queryset_to_dict(annotated_requests, is_model=False)
            )
            .exclude(status__in=[DomainRequest.DomainRequestStatus.STARTED])
            .order_by("status","requested_domain__name",)
            .distinct()
        )
-        extra_values = DomainRequestExport.annotate_request_and_return_values(requests, annotations, values_to_return)
+        # Write the csv file
-        DomainRequestExport.write_csv_for_requests(writer, cls.all_columns, requests, extra_values, should_write_header=True)
+        cls.write_csv_for_requests(writer, cls.all_columns, requests_dict)
    @staticmethod
-    def annotate_request_and_return_values(requests, annotations, values_to_return, return_dict=True) -> QuerySet | dict:
+    def write_csv_for_requests(
        writer,
        columns,
        requests_dict,
        should_write_header=True,
    ):
        """Receives params from the parent methods and outputs a CSV with filtered and sorted requests.
        Works with write_header as long as the same writer object is passed."""
        rows = []
        for request in requests_dict.values():
            try:
                row = DomainRequestExport.parse_row_for_requests(columns, request)
                rows.append(row)
            except ValueError as err:
                logger.error(f"csv_export -> Error when parsing row: {err}")
                continue
        if should_write_header:
            write_header(writer, columns)
        writer.writerows(rows)
    @staticmethod
    def parse_row_for_requests(columns, request, show_expanded_org_type=False):
        """
-        Annotates a queryset with specified annotations and retrieves specified fields.
+        Given a set of columns and a request dictionary,
        generate a new row from cleaned column data
        """
        # FK fields
        federal_agency = "federal_agency"
        ao = "authorizing_official"
        creator = "creator"
        investigator = "investigator"
        # Handle the federal_type field. Defaults to the wrong format.
        federal_type = request.get("federal_type")
        human_readable_federal_type = DomainRequest.BranchChoices.get_branch_label(federal_type) if federal_type else None
        # Handle the org_type field. Either "Tribal" or "Federal - Executive".
        org_type = request.get("organization_type")
        human_readable_org_type = DomainRequest.OrganizationChoices.get_org_label(org_type) if org_type else None
        if human_readable_org_type and human_readable_federal_type and show_expanded_org_type:
            human_readable_org_type = f"{human_readable_org_type} - {human_readable_federal_type}"
        # Handle the status field. Defaults to the wrong format.
        status = request.get("status")
        status_display = DomainRequest.DomainRequestStatus.get_status_label(status) if status else None
        # Handle the region field.
        state_territory = request.get("state_territory")
        region = get_region(state_territory) if state_territory else None
        requested_domain = request.get("requested_domain__name")
        requested_domain_name = requested_domain if requested_domain else "No requested domain"
        # Handle the election field. N/A if None, "Yes"/"No" if boolean
        human_readable_election_board = "N/A"
        if request.get("is_election_board") is not None:
            human_readable_election_board = "Yes" if request.is_election_board else "No"
        # Handle the additional details field. Pipe seperated
        details = [request.get("cisa_representative_email"), request.get("anything_else")]
        additional_details = " | ".join([field for field in details if field is not None])
        # create a dictionary of fields which can be included in output.
        # "extra_fields" are precomputed fields (generated in the DB or parsed).
        FIELDS = {
            # Parsed fields - defined above.
            "Domain request": requested_domain_name,
            "Region": region,
            "Status": status_display,
            "Election office": human_readable_election_board,
            "Federal type": human_readable_federal_type,
            "Domain type": human_readable_org_type,
            "Request additional details": additional_details,
            # Annotated fields - passed into the request dict.
            "Creator approved domains count": request.get("creator_approved_domains_count", 0),
            "Creator active requests count": request.get("creator_active_requests_count", 0),
            "Alternative domains": request.get("all_alternative_domains"),
            "Other contacts": request.get("all_other_contacts"),
            "Current websites": request.get("all_current_websites"),
            # Untouched FK fields - passed into the request dict.
            "Federal agency": request.get(f"{federal_agency}__agency"),
            "AO first name": request.get(f"{ao}__first_name"),
            "AO last name": request.get(f"{ao}__last_name"),
            "AO email": request.get(f"{ao}__email"),
            "AO title/role": request.get(f"{ao}__title"),
            "Creator first name": request.get(f"{creator}__first_name"),
            "Creator last name": request.get(f"{creator}__last_name"),
            "Creator email": request.get(f"{creator}__email"),
            "Investigator": request.get(f"{investigator}__email"),
            # Untouched fields
            "Organization name": request.get("organization_name"),
            "City": request.get("city"),
            "State/territory": request.get("state_territory"),
            "Request purpose": request.get("purpose"),
            "CISA regional representative": request.get("cisa_representative_email"),
            "Submitted at": request.get("submission_date"),
        }
        row = [FIELDS.get(column, "") for column in columns]
        return row
    @classmethod
    def annotate_and_retrieve_fields(cls, requests, annotations, additional_values=None) -> QuerySet:
        """
        Applies annotations to a queryset and retrieves specified fields, 
        including class-defined and annotation-defined.
        Parameters:
-            requests (QuerySet): The initial queryset to which annotations will be applied.
+            requests (QuerySet): Initial queryset.
-            annotations (dict): A dictionary where keys are names of the new fields to create, and values are
+            annotations (dict, optional): Fields to compute {field_name: expression}.
-                                expressions that describe how to calculate these fields.
+            additional_values (list, optional): Extra fields to retrieve; defaults to annotation keys if None.
-            values_to_return (list): A list of strings that specify which fields should be included in the final
+
                                    output, in addition to the 'id' field which is included by default.
            return_dict (bool): If True, the method returns a dictionary where each key is an 'id' of an item
                                and each value is a dictionary of the fields specified in `values_to_return`.
                                If False, the method returns a QuerySet containing dictionaries of the requested fields.
        Returns:
-            QuerySet | dict: Depending on the value of `return_dict`, returns either a QuerySet or a dictionary.
+            QuerySet: Contains dictionaries with the specified fields for each record.
                            The QuerySet contains dictionaries for each record with the specified fields.
                            The dictionary contains keys as record ids and values as dictionaries of the specified fields.
        """
-        queryset = requests.annotate(**annotations).values("id", *values_to_return)
+        if annotations is None:
-        if return_dict:
+            annotations = {}
            requests_dict = {value["id"]: value for value in queryset}
            return requests_dict
        if additional_values is None:
            additional_values = []
        # We can infer that if we're passing in annotations,
        # we want to grab the result of said annotation.
        if annotations:
            additional_values.extend(annotations.keys())
        queryset = requests.annotate(**annotations).values(*cls.domain_request_fields, *additional_values)
        return queryset
    # ============================================================= #
    # Helper functions for django ORM queries.                      #
    # We are using these rather than pure python for speed reasons. #
    # ============================================================= #
    # AXE THIS
    @staticmethod
    def get_additional_details_query(default_message=None, delimiter=" | "):
        """
        A SQL case statement for DomainRequest.anything_else and DomainRequest.cisa_representative_email.
        When ran, returns a concatenation of anything_else and cisa_representative_email - seperated by " | ".
        Equivalent to:
        `f"{cisa_rep} | {anything_else}" If anything_else or cisa_rep else None`
        """
        # TODO this should be replaced with cisa_representative_first_name and cisa_representative_last_name
        additional_details_query = Case(
            When(
                cisa_representative_email__isnull=False,
                anything_else__isnull=False,
                then=Concat(F("cisa_representative_email"), Value(delimiter), F("anything_else")),
            ),
            When(
                cisa_representative_email__isnull=True,
                anything_else__isnull=False,
                then=F("anything_else"),
            ),
            When(
                cisa_representative_email__isnull=False,
                anything_else__isnull=True,
                then=F("cisa_representative_email"),
            ),
            default=Value(default_message),
            output_field=CharField(),
        )
        return additional_details_query
    @staticmethod
    def get_all_other_contacts_query(delimiter=" | "):