Skip to content

Commit

Permalink
Merge pull request #287 from gtnx/issue-286
Browse files Browse the repository at this point in the history
fix: Reuse pd.DataFrame index in _transform
  • Loading branch information
guillermo-navas-palencia committed Dec 6, 2023
2 parents 4d915ea + 9bccf9c commit 2477d5c
Show file tree
Hide file tree
Showing 2 changed files with 8 additions and 1 deletion.
2 changes: 1 addition & 1 deletion optbinning/binning/binning_process.py
Original file line number Diff line number Diff line change
Expand Up @@ -1423,7 +1423,7 @@ def _transform(self, X, metric, metric_special, metric_missing,
X_transform[:, i] = optb.transform(**tparams)

if isinstance(X, pd.DataFrame):
return pd.DataFrame(X_transform, columns=selected_variables)
return pd.DataFrame(X_transform, columns=selected_variables, index=X.index)

return X_transform

Expand Down
7 changes: 7 additions & 0 deletions tests/test_binning_process.py
Original file line number Diff line number Diff line change
Expand Up @@ -580,3 +580,10 @@ def test_verbose():
with open("tests/results/test_binning_process_verbose.txt", "w") as f:
with redirect_stdout(f):
process.fit(X, y, check_input=True)


def test_dataframe_index():
process = BinningProcess(variable_names)
X_train = pd.DataFrame(X, columns=variable_names, index=[2 * i for i in range(len(X))])
X_transform = process.fit_transform(X_train, y, metric="indices")
pd.testing.assert_index_equal(X_train.index, X_transform.index)

0 comments on commit 2477d5c

Please sign in to comment.