Skip to content

Commit 73e110d

Browse files
committed
refactoring
1 parent 6d0aed6 commit 73e110d

File tree

5 files changed

+22
-23
lines changed

5 files changed

+22
-23
lines changed

crep/base.py

Lines changed: 14 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -1438,8 +1438,8 @@ def segmentation_regular(
14381438

14391439

14401440
def fill_segmentation(
1441-
df_segm: pd.DataFrame,
1442-
df_feat: pd.DataFrame,
1441+
df_segmentation: pd.DataFrame,
1442+
df_features: pd.DataFrame,
14431443
id_discrete: list[str],
14441444
id_continuous: list[str],
14451445
dict_agg: dict[str, list[str]] | None = None
@@ -1449,9 +1449,9 @@ def fill_segmentation(
14491449
14501450
Parameters
14511451
----------
1452-
df_segm: pd.DataFrame
1452+
df_segmentation: pd.DataFrame
14531453
the dataframe containing the segmentation. Should contain only columns id_discrete and id_continuous
1454-
df_feat: pd.DataFrame
1454+
df_features: pd.DataFrame
14551455
the dataframe containing the features to fit to the segmentation. Should contain the columns
14561456
id_discrete and id_continuous as well as other columns for the features of interest.
14571457
id_discrete
@@ -1465,14 +1465,14 @@ def fill_segmentation(
14651465
"""
14661466
# verification of requirements
14671467
for col in id_continuous + id_discrete:
1468-
if col not in df_segm.columns or col not in df_feat.columns:
1468+
if col not in df_segmentation.columns or col not in df_features.columns:
14691469
raise Exception(f"Error: {col} is not present in both dataframes df_segm and df_feat.")
14701470

14711471
is_df_segm_admissible = tools.admissible_dataframe(
1472-
data=df_segm, id_discrete=id_discrete, id_continuous=id_continuous
1472+
data=df_segmentation, id_discrete=id_discrete, id_continuous=id_continuous
14731473
)
14741474
is_df_feat_admissible = tools.admissible_dataframe(
1475-
data=df_feat, id_discrete=id_discrete, id_continuous=id_continuous
1475+
data=df_features, id_discrete=id_discrete, id_continuous=id_continuous
14761476
)
14771477
if not is_df_segm_admissible or not is_df_feat_admissible:
14781478
raise Exception("Error: Both dataframes should be admissible:"
@@ -1481,9 +1481,9 @@ def fill_segmentation(
14811481

14821482
# homogenize_between() reduces the difference in segment size between df_features and df_segmentation. More
14831483
# precisely, it adjusts df_features to df_segmentation. This may reduce the risk of error when using merge().
1484-
df_segm, df_feat = homogenize_between(
1485-
df1=df_segm,
1486-
df2=df_feat,
1484+
df_segmentation, df_features = homogenize_between(
1485+
df1=df_segmentation,
1486+
df2=df_features,
14871487
id_discrete=id_discrete,
14881488
id_continuous=id_continuous,
14891489
dict_agg_df1=None,
@@ -1492,13 +1492,13 @@ def fill_segmentation(
14921492
verbose=False
14931493
)
14941494

1495-
df_segm["__id__"] = 1
1496-
df_segm["__id__"] = df_segm["__id__"].cumsum()
1495+
df_segmentation["__id__"] = 1
1496+
df_segmentation["__id__"] = df_segmentation["__id__"].cumsum()
14971497

14981498
# merging the segmentations in both df
14991499
df_merge = merge(
1500-
data_left=df_segm,
1501-
data_right=df_feat,
1500+
data_left=df_segmentation,
1501+
data_right=df_features,
15021502
id_continuous=id_continuous,
15031503
id_discrete=id_discrete,
15041504
how="left",

doc/requirements.txt

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -7,5 +7,4 @@ nbsphinx
77
sphinx-autoapi
88
sphinx-version-warning
99
sphinx-prompt
10-
numpydoc
11-
pandas
10+
numpydoc

test/conftest.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -9,13 +9,13 @@
99

1010
@fixture(scope="module")
1111
def get_examples():
12-
df_left = pd.read_csv("../data/base_left.csv")
13-
df_right = pd.read_csv("../data/base_right.csv")
12+
df_left = pd.read_csv("data/base_left.csv")
13+
df_right = pd.read_csv("data/base_right.csv")
1414
return df_left, df_right
1515

1616

1717
@fixture(scope="module")
1818
def get_advanced_examples():
19-
df_left = pd.read_csv("../data/advanced_left.csv")
20-
df_right = pd.read_csv("../data/advanced_right.csv")
19+
df_left = pd.read_csv("data/advanced_left.csv")
20+
df_right = pd.read_csv("data/advanced_right.csv")
2121
return df_left, df_right

test/test_base.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -849,8 +849,8 @@ def test_fill_segmentation():
849849
"data2": [1, 0, 1, 1, 0, 1, 0, 0],
850850
})
851851
df_test = fill_segmentation(
852-
df_segm=df_segm,
853-
df_feat=df_feat,
852+
df_segmentation=df_segm,
853+
df_features=df_feat,
854854
id_discrete=["discr1"],
855855
id_continuous=["cont1", "cont2"],
856856
dict_agg={"mean": ["data1"], "sum": ["data2"]}

test/test_tools.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@
1111

1212
id_discrete, id_continuous = ["id", "id2"], ["t1", "t2"]
1313

14-
data = pd.read_csv("../examples/data/data_zones.csv")
14+
data = pd.read_csv("examples/data/data_zones.csv")
1515

1616

1717
def test_no_overlapping(get_examples):

0 commit comments

Comments
 (0)