We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ada39ea commit 378125e — Copy full SHA for 378125e
hlink/linking/core/transforms.py
@@ -336,6 +336,16 @@ def generate_transforms(
336
is_a: bool,
337
id_col: str,
338
) -> DataFrame:
339
+ """Generate feature selection columns and return the input dataframe with these new columns attached.
340
+
341
+ Args:
342
+ spark: the Spark session
343
+ df_selected: the input Spark DataFrame
344
+ feature_selections: a list of feature selections to compute
345
+ link_task: the current LinkTask
346
+ is_a: whether this is dataset A (True) or dataset B (False)
347
+ id_col: the name of the identifier column in the input data frame
348
+ """
349
not_skipped_feature_selections = [
350
c
351
for c in feature_selections
0 commit comments