Skip to content

Commit 6dc4dd2

Browse files
committed May 23, 2024
remove intermediate df
1 parent ab1a97b commit 6dc4dd2

File tree

1 file changed

+5
-2
lines changed
  • statistical_methods_library/imputation

1 file changed

+5
-2
lines changed
 

‎statistical_methods_library/imputation/engine.py

+5 -2
Original file line number | Diff line number | Diff line change
@@ -579,7 +579,6 @@ def calculate_weighted_link(link_name):
579579
if manual_construction_col:
580580
# populate link, count, default information
581581
# for manual_construction data
582-
unique_grp_prd = prepared_df.dropDuplicates(["period", "grouping"])
583582
# Get the required additional output columns
584583
mc_cols = manual_construction_df.columns
585584
mc_additional_cols = []
@@ -592,7 +591,11 @@ def calculate_weighted_link(link_name):
592591
mc_additional_cols.append(key)
593592
manual_construction_df = (
594593
manual_construction_df.alias("mc")
595-
.join(unique_grp_prd, ["period", "grouping"], "leftouter")
594+
.join(
595+
prepared_df.dropDuplicates(["period", "grouping"]),
596+
["period", "grouping"],
597+
"leftouter",
598+
)
596599
.select(
597600
*(f"mc.{name}" for name in mc_cols),
598601
*mc_additional_cols,

0 commit comments

Comments
 (0)