We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 5d41c48, commit 5e5e3c8. Copy full SHA for 5e5e3c8
1 file changed
sdmetrics/column_pairs/statistical/contingency_similarity.py
@@ -117,7 +117,9 @@ def compute_breakdown(
117
contingency_synthetic = synthetic.groupby(list(columns), dropna=False).size() / len(
118
synthetic
119
)
120
- combined_index = contingency_real.index.union(contingency_synthetic.index, sort=False)
+ combined_index = contingency_real.index.union(
121
+ contingency_synthetic.index, sort=False
122
+ ).drop_duplicates()
123
contingency_synthetic = contingency_synthetic.reindex(combined_index, fill_value=0)
124
contingency_real = contingency_real.reindex(combined_index, fill_value=0)
125
diff = abs(contingency_real - contingency_synthetic).fillna(0)
0 commit comments