Source code for immuneML.ml_methods.clustering.HDBSCAN

from immuneML.data_model.datasets.Dataset import Dataset
from immuneML.ml_methods.clustering.ClusteringMethod import ClusteringMethod, get_data_for_clustering
from sklearn.cluster import HDBSCAN as SklearnHDBSCAN


[docs] class HDBSCAN(ClusteringMethod): """ HDBSCAN method which wraps scikit-learn's clustering of the same name. Input arguments for the method are the same as supported by scikit-learn (see `DBSCAN scikit-learn documentation <https://scikit-learn.org/stable/modules/generated/sklearn.cluster.HDBSCAN.html>`_ for details). **YAML specification:** .. indent with spaces .. code-block:: yaml definitions: ml_methods: my_hdbscan: HDBSCAN: # arguments as defined by scikit-learn min_cluster_size: 5 """ def __init__(self, name=None, **kwargs): super().__init__(name) self.model = SklearnHDBSCAN(**kwargs)
[docs] def fit(self, dataset: Dataset): data = get_data_for_clustering(dataset) self.model.fit(data)
[docs] def fit_predict(self, dataset: Dataset): data = get_data_for_clustering(dataset) return self.model.fit_predict(data)
[docs] def predict(self, dataset: Dataset): raise RuntimeError("HDBSCAN Clustering does not support predict method")
[docs] def transform(self, dataset: Dataset): raise RuntimeError("HDBSCAN Clustering does not support transform method")