def compute_silhouette_scores(reduced_embeddings, clustering_results):
    """
    Compute one silhouette score per entry of ``clustering_results``.

    Each entry's labels are scored against ``reduced_embeddings`` by calling
    ``silhouette_score``; a summary line is printed for every entry as it is
    processed.

    NOTE(review): ``silhouette_score`` is not imported in the visible file;
    presumably it is ``sklearn.metrics.silhouette_score`` -- confirm and add
    the import at module level, otherwise any non-empty input raises
    ``NameError``.

    :param reduced_embeddings: Matrix of reduced embeddings, passed unchanged
        as the first argument of ``silhouette_score``
    :param clustering_results: Dictionary mapping a number of clusters to the
        labels predicted for that number of clusters
    :return: Dictionary mapping each key of ``clustering_results`` to its
        silhouette score
    """
    scores_by_cluster_count = {}

    for n_clusters, predicted_labels in clustering_results.items():
        # Score first, then record and report the same value.
        silhouette_avg = silhouette_score(reduced_embeddings, predicted_labels)
        scores_by_cluster_count[n_clusters] = silhouette_avg
        print(
            f"Nombre de clusters: {n_clusters}, Silhouette Score: {silhouette_avg:.2f}"
        )

    return scores_by_cluster_count