|
5 | 5 | convert_categorical_to_continuous,
|
6 | 6 | convert_to_cuts,
|
7 | 7 | convert_to_intervals,
|
8 |
| - deduplicate_bins, |
| 8 | + remove_extra_bins, |
9 | 9 | make_bag,
|
10 | 10 | )
|
11 | 11 |
|
12 | 12 |
|
13 |
| -def test_deduplicate_bins(): |
| 13 | +def test_remove_extra_bins(): |
14 | 14 | bins = [
|
15 | 15 | [{"a": 1, "b": 2}, {"a": 2, "b": 1}, {"b": 2, "a": 1}, {"b": 2, "a": 1}],
|
16 | 16 | [
|
17 |
| - np.array([1, 2, 3], dtype=np.float64), |
18 | 17 | np.array([1, 3, 2], dtype=np.float64),
|
19 | 18 | np.array([1, 2, 3], dtype=np.float64),
|
| 19 | + np.array([1, 2, 3], dtype=np.float64), |
| 20 | + ], |
| 21 | + [ |
| 22 | + np.array([9, 8, 7], dtype=np.float64), |
20 | 23 | ],
|
| 24 | + [{"m": 1, "q": 2}], |
| 25 | + [{"r": 7, "t": 8}, {"r": 7, "t": 8}], |
| 26 | + [{"one": 1, "two": 2}], |
| 27 | + [{"never_used": 1, "never_ever": 2}], |
| 28 | + [], |
21 | 29 | ]
|
22 | 30 |
|
23 |
| - deduplicate_bins(bins) |
| 31 | + remove_extra_bins([(0, 1, 2, 3, 4), (5,)], bins) |
24 | 32 |
|
25 | 33 | assert len(bins[0]) == 3
|
26 |
| - assert id(bins[0][0]) != id(bins[0][1]) |
27 |
| - assert id(bins[0][0]) == id(bins[0][2]) |
28 |
| - assert id(bins[0][1]) != id(bins[0][2]) |
29 |
| - |
30 |
| - assert len(bins[1]) == 3 |
31 |
| - assert id(bins[1][0]) != id(bins[1][1]) |
32 |
| - assert id(bins[1][0]) == id(bins[1][2]) |
33 |
| - assert id(bins[1][1]) != id(bins[1][2]) |
| 34 | + assert len(bins[1]) == 2 |
| 35 | + assert len(bins[2]) == 1 |
| 36 | + assert len(bins[3]) == 1 |
| 37 | + assert len(bins[4]) == 1 |
| 38 | + assert len(bins[5]) == 1 |
| 39 | + assert len(bins[6]) == 0 |
| 40 | + assert len(bins[7]) == 0 |
34 | 41 |
|
35 | 42 |
|
36 | 43 | def test_conversion_cut_intervals():
|
|
0 commit comments