Skip to content

Commit

Permalink
Merge pull request #277 from alexliap/read_save_bins
Browse files Browse the repository at this point in the history
Read/save bins Issue #96
  • Loading branch information
guillermo-navas-palencia committed Jan 9, 2024
2 parents 1ca485e + cabcdf8 commit 1a74eb5
Show file tree
Hide file tree
Showing 3 changed files with 167 additions and 0 deletions.
56 changes: 56 additions & 0 deletions optbinning/binning/binning.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,8 @@

from sklearn.utils import check_array

import json

from ..information import solver_statistics
from ..logging import Logger
from .auto_monotonic import auto_monotonic
Expand Down Expand Up @@ -1174,3 +1176,57 @@ def status(self):
self._check_is_fitted()

return self._status

def to_json(self, path: str):
"""
Save optimal bins and/or splits points and transformation depending on the target type.
Parameters
----------
path: The path where the json is going to be saved
"""
if path is None:
raise ValueError('Specify the path for the json file')

table = self.binning_table

opt_bin_dict=dict()
opt_bin_dict['name'] = table.name
opt_bin_dict['dtype'] = table.dtype
opt_bin_dict['special_codes'] = table.special_codes

if table.dtype == 'numerical':
opt_bin_dict['splits'] = table.splits.tolist()
elif table.dtype == 'categorical':
opt_bin_dict['splits'] = [split.tolist() for split in table.splits]

opt_bin_dict['n_nonevent'] = table.n_nonevent.tolist()
opt_bin_dict['n_event'] = table.n_event.tolist()

opt_bin_dict['min_x'] = table.min_x
opt_bin_dict['max_x'] = table.max_x
opt_bin_dict['categories'] = table.categories
opt_bin_dict['cat_others'] = table.cat_others
opt_bin_dict['user_splits'] = table.user_splits

with open(path, "w") as write_file:
json.dump(opt_bin_dict, write_file)

def read_json(self, path: str):
"""
Read json file containing split points and set them as the new split points.
Parameters
----------
path: The path of the json file.
"""
self._is_fitted = True

with open(path, "r") as read_file:
bin_table_attr = json.load(read_file)

for key in bin_table_attr.keys():
if isinstance(bin_table_attr[key], list):
bin_table_attr[key] = np.array(bin_table_attr[key])

self._binning_table = BinningTable(**bin_table_attr)
62 changes: 62 additions & 0 deletions optbinning/binning/continuous_binning.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@

import numbers
import time
import json

from sklearn.utils import check_array

Expand Down Expand Up @@ -977,3 +978,64 @@ def binning_table(self):
self._check_is_fitted()

return self._binning_table

def to_json(self, path: str):
"""
Save optimal bins and/or splits points and transformation depending on the target type.
Parameters
----------
path: The path where the json is going to be saved
"""
if path is None:
raise ValueError('Specify the path for the json file.')

table = self.binning_table

opt_bin_dict=dict()
opt_bin_dict['name'] = table.name
opt_bin_dict['dtype'] = table.dtype
opt_bin_dict['special_codes'] = table.special_codes

if table.dtype == 'numerical':
opt_bin_dict['splits'] = table.splits.tolist()
elif table.dtype == 'categorical':
opt_bin_dict['splits'] = [split.tolist() for split in table.splits]

opt_bin_dict['n_records'] = table.n_records.tolist()
opt_bin_dict['sums'] = table.sums.tolist()
opt_bin_dict['stds'] = table.stds.tolist()
opt_bin_dict['min_target'] = table.min_target.tolist()
opt_bin_dict['max_target'] = table.max_target.tolist()
opt_bin_dict['n_zeros'] = table.n_zeros.tolist()

opt_bin_dict['min_x'] = table.min_x
opt_bin_dict['max_x'] = table.max_x
opt_bin_dict['categories'] = table.categories
opt_bin_dict['cat_others'] = table.cat_others
opt_bin_dict['user_splits'] = table.user_splits

with open(path, "w") as write_file:
json.dump(opt_bin_dict, write_file)

def read_json(self, path: str):
"""
Read json file containing split points and set them as the new split points.
Parameters
----------
path: The path of the json file.
"""
if path is None:
raise ValueError('Specify the path for the json file.')

self._is_fitted = True

with open(path, "r") as read_file:
cont_table_attr = json.load(read_file)

for key in cont_table_attr.keys():
if isinstance(cont_table_attr[key], list):
cont_table_attr[key] = np.array(cont_table_attr[key])

self._binning_table = ContinuousBinningTable(**cont_table_attr)
49 changes: 49 additions & 0 deletions optbinning/binning/multiclass_binning.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@

import numbers
import time
import json

import numpy as np

Expand Down Expand Up @@ -873,3 +874,51 @@ def splits(self):
self._check_is_fitted()

return self._splits_optimal

def to_json(self, path: str):
"""
Save optimal bins and/or splits points and transformation depending on the target type.
Parameters
----------
path: The path where the json is going to be saved
"""
if path is None:
raise ValueError('Specify the path for the json file.')

table = self.binning_table

opt_bin_dict=dict()
opt_bin_dict['name'] = table.name
opt_bin_dict['special_codes'] = table.special_codes

opt_bin_dict['splits'] = table.splits.tolist()

opt_bin_dict['n_event'] = table.n_event.tolist()

opt_bin_dict['classes'] = table.classes.tolist()

with open(path, "w") as write_file:
json.dump(opt_bin_dict, write_file)

def read_json(self, path: str):
"""
Read json file containing split points and set them as the new split points.
Parameters
----------
path: The path of the json file.
"""
if path is None:
raise ValueError('Specify the path for the json file.')

self._is_fitted = True

with open(path, "r") as read_file:
multi_table_attr = json.load(read_file)

for key in multi_table_attr.keys():
if isinstance(multi_table_attr[key], list):
multi_table_attr[key] = np.array(multi_table_attr[key])

self._binning_table = MulticlassBinningTable(**multi_table_attr)

0 comments on commit 1a74eb5

Please sign in to comment.