# Ordered Clustering
This notebook shows an example of how to use the "Ordered Clustering" module (`modular_parts.M25_OrderedClustering`).

In [1]:
# Turn off Jedi-based tab completion in IPython. This only changes the
# interactive completion behaviour; it has no effect on the computed results.
%config Completer.use_jedi = False

## Definition of inputs and problem formalization

In [2]:
import pandas as pd

from core.clusters_commons import change_clusters_output
from core.enums import Direction, GeneralCriterion
from modular_parts.M3_PrometheePreference import compute_preference_indices
from modular_parts.M25_OrderedClustering import group_into_ordered_clusters

# Labels: seven alternatives (a1..a7), three profiles (p1..p3) and three
# criteria (c1..c3).
# NOTE(review): `profiles` is not referenced by any other cell visible in this
# notebook -- confirm whether it is still needed.
alternatives = ["a" + str(number) for number in range(1, 8)]
profiles = ["p" + str(number) for number in range(1, 4)]
criteria = ["c" + str(number) for number in range(1, 4)]

# Per-criterion settings; every Series below is indexed by criterion name.
criteria_directions = pd.Series(
    data=[Direction.MAX, Direction.MIN, Direction.MAX],
    index=criteria,
)
# The three weights add up to 1.0.
criteria_weights = pd.Series(data=[0.3, 0.2, 0.5], index=criteria)
generalised_criteria = pd.Series(
    data=[
        GeneralCriterion.U_SHAPE,
        GeneralCriterion.V_SHAPE_INDIFFERENCE,
        GeneralCriterion.USUAL,
    ],
    index=criteria,
)

# Thresholds per criterion; c3 (GeneralCriterion.USUAL) is given None for both.
preference_thresholds = pd.Series(data=[2, 10, None], index=criteria)
indifference_thresholds = pd.Series(data=[1, 5, None], index=criteria)
# All None, because GeneralCriterion.GAUSSIAN is not used for any criterion.
standard_deviations = pd.Series(data=[None, None, None], index=criteria)

# Performance table: one row per alternative, one column per criterion.
alternatives_performances = pd.DataFrame(
    data=[
        [15, 83, 21],
        [10, 90, 15],
        [11, 75, 20],
        [18, 59, 20],
        [17, 60, 28],
        [22, 44, 15],
        [13, 62, 22],
    ],
    index=alternatives,
    columns=criteria,
)

## Required preferences

In [3]:
# Compute the pairwise preference indices from the inputs defined above.
# The call returns two values; only the first (the alternative-by-alternative
# matrix displayed below) is kept, the second is discarded via `_`.
# NOTE(review): arguments are passed positionally -- confirm the order against
# the signature of compute_preference_indices.
aggregated_alternatives_preferences, _ = compute_preference_indices(alternatives_performances,
                                                                    preference_thresholds,
                                                                    indifference_thresholds,
                                                                    standard_deviations,
                                                                    generalised_criteria,
                                                                    criteria_directions,
                                                                    criteria_weights)
aggregated_alternatives_preferences

Unnamed: 0,a1,a2,a3,a4,a5,a6,a7
a1,0.0,0.88,0.8,0.5,0.0,0.5,0.3
a2,0.0,0.0,0.0,0.0,0.0,0.0,0.0
a3,0.12,0.7,0.0,0.0,0.0,0.5,0.0
a4,0.5,1.0,0.5,0.0,0.0,0.5,0.3
a5,1.0,1.0,1.0,0.5,0.0,0.5,0.8
a6,0.5,0.5,0.5,0.5,0.5,0.0,0.5
a7,0.7,1.0,1.0,0.5,0.0,0.5,0.0


## Ordered Clustering

In [4]:
# Group the alternatives into k=3 clusters using the preference matrix computed
# above. The result (shown below) is a Series indexed by cluster label (C1..C3)
# whose values are lists of alternative names.
# NOTE(review): presumably C1 is the most preferred cluster -- confirm against
# the module documentation.
clusters = group_into_ordered_clusters(aggregated_alternatives_preferences, k=3)
clusters

C1        [a4, a5]
C2        [a1, a7]
C3    [a2, a3, a6]
Name: Alternatives in clusters, dtype: object

### Change output format

In [5]:
# Re-express the clustering as an alternative -> cluster mapping: the input is
# a Series of cluster label -> list of alternatives, and the output shown below
# is a Series indexed by alternative with the cluster label as value.
# `change_clusters_output` is imported in the notebook's import cell together
# with the other dependencies, so a missing dependency fails at the top of
# "Restart & Run All" rather than in the last cell.
change_clusters_output(clusters)

a1    C2
a2    C3
a3    C3
a4    C1
a5    C1
a6    C3
a7    C2
dtype: object