## phi relevance control points handed to smogn below, one row per region.
## the row starting with 0 is the under-sample ("majority") region; the rows
## starting with 1, 2 and 3 are the over-sample ("minority") regions.
## the second entry is 0 for the under-sample row and 1 for the over-sample
## rows; the third entry is 0 everywhere.
## NOTE(review): presumably each row is [target value, relevance, slope] --
## confirm against the smogn documentation.
rg_mtrx = [[0, 0, 0]] + [[count, 1, 0] for count in (1, 2, 3)]
## phi relevance arguments, grouped so they read as one unit.
## rel_method is 'manual', so the control points come from rg_mtrx;
## rel_xtrm_type and rel_coef are deliberately not passed because they are
## unused when rel_method = 'manual'.
_phi_relevance_args = {
    'rel_thres': 0.50,  ## real number (0 < R < 1)
    'rel_method': 'manual',  ## string ('auto' or 'manual')
    ## 2d array of control points (rows in rg_mtrx have three entries)
    'rel_ctrl_pts_rg': rg_mtrx,
}

## conduct smogn on df, using 'Room_Occupancy_Count' as the y column
balanced_smogn = smogn.smoter(
    ## main arguments
    data=df,  ## pandas dataframe
    y='Room_Occupancy_Count',  ## string ('header name')
    k=5,  ## positive integer (k < n)
    pert=0.02,  ## real number (0 < R < 1)
    samp_method='extreme',  ## string ('balance' or 'extreme')
    drop_na_col=False,  ## boolean (True or False)
    drop_na_row=False,  ## boolean (True or False)
    replace=True,  ## boolean (True or False)
    ## phi relevance arguments (see _phi_relevance_args)
    **_phi_relevance_args
)