diff --git a/koku/masu/processor/tasks.py b/koku/masu/processor/tasks.py index 61cd1db79b..72049083e7 100644 --- a/koku/masu/processor/tasks.py +++ b/koku/masu/processor/tasks.py @@ -318,10 +318,15 @@ def summarize_reports( # noqa: C901 """ reports_by_source = defaultdict(list) + schema_name = None for report in reports_to_summarize: if report: reports_by_source[report.get("provider_uuid")].append(report) + if schema_name is None: + # Only set the schema name once + schema_name = report.get("schema_name") + reports_deduplicated = [] dedup_func_map = { Provider.PROVIDER_GCP: deduplicate_reports_for_gcp, @@ -329,7 +334,12 @@ def summarize_reports( # noqa: C901 Provider.PROVIDER_OCI: deduplicate_reports_for_oci, Provider.PROVIDER_OCI_LOCAL: deduplicate_reports_for_oci, } - LOG.info(log_json("summarize_reports", msg="deduplicating reports")) + + kwargs = {} + if schema_name: + kwargs["schema_name"] = schema_name + + LOG.info(log_json("summarize_reports", msg="deduplicating reports", **kwargs)) for report_list in reports_by_source.values(): if report and report.get("provider_type") in dedup_func_map: provider_type = report.get("provider_type") @@ -357,7 +367,13 @@ def summarize_reports( # noqa: C901 } ) - LOG.info(log_json("summarize_reports", msg=f"deduplicated reports, num report: {len(reports_deduplicated)}")) + LOG.info( + log_json( + "summarize_reports", + msg=f"deduplicated reports, num report: {len(reports_deduplicated)}", + **kwargs, + ) + ) for report in reports_deduplicated: # For day-to-day summarization we choose a small window to # cover new data from a window of days.