Source code for cytoflowgui.workflow.operations.kmeans

#!/usr/bin/env python3.8
# coding: latin-1

# (c) Massachusetts Institute of Technology 2015-2018
# (c) Brian Teague 2018-2022
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 2 of the License, or
# (at your option) any later version.
# 
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
# 
# You should have received a copy of the GNU General Public License
# along with this program.  If not, see <http://www.gnu.org/licenses/>.

"""
cytoflowgui.workflow.operations.kmeans
--------------------------------------

"""

from traits.api import (provides, Instance, Str, Property, observe, Constant,
                        List, Dict, Any, DelegatesTo)

import sklearn.cluster 

from cytoflow.operations.kmeans import KMeansOp, KMeans2DView
import cytoflow.utility as util

from ..views import IWorkflowView, WorkflowByView, ScatterplotPlotParams
from ..serialization import camel_registry, traits_str, cytoflow_class_repr, dedent
from ..subset import ISubset

from .operation_base import IWorkflowOperation, WorkflowOperation

# Give the base KMeansOp the shared repr helper imported from ..serialization.
# KMeansWorkflowOp.get_notebook_code() embeds repr() of a plain KMeansOp in the
# code it generates.
KMeansOp.__repr__ = cytoflow_class_repr


[docs]
@provides(IWorkflowOperation)
class KMeansWorkflowOp(WorkflowOperation, KMeansOp):
    """
    Workflow (GUI) flavour of `KMeansOp`.

    Declares the operation's parameters as traits tagged with ``apply``,
    ``estimate`` or ``estimate_result`` metadata, and builds the ``subset``
    expression from the entries of ``subset_list``.
    """

    # parameter tagged with "apply" metadata
    name = Str(apply=True)

    # parameters tagged with "estimate" metadata
    xchannel = Str(estimate=True)
    ychannel = Str(estimate=True)
    xscale = util.ScaleEnum(estimate=True)
    yscale = util.ScaleEnum(estimate=True)
    num_clusters = util.PositiveCInt(2, allow_zero=False, estimate=True)

    by = List(Str, estimate=True)

    # dict of MiniBatchKMeans instances, tagged with "estimate_result"
    # metadata (and marked transient)
    _kmeans = Dict(
        Any,
        Instance(sklearn.cluster.MiniBatchKMeans),
        transient=True,
        estimate_result=True,
    )

    # "subset" overrides the base class's trait with a Property that is
    # generated / updated from subset_list
    subset = Property(Str, observe="subset_list.items.str")
    subset_list = List(ISubset, estimate=True)

    # support for the subset editor
    @observe('subset_list:items.str')
    def _on_subset_changed(self, _event):
        self.changed = 'subset_list'

    # getter for the "subset" Property above: joins the non-empty
    # expressions of the subset_list entries with " and "
    def _get_subset(self):
        clauses = (entry.str for entry in self.subset_list if entry.str)
        return " and ".join(clauses)
            

[docs]
    def default_view(self, **kwargs):
        """
        Return a `KMeansWorkflowView` bound to this operation.

        Any keyword arguments are forwarded to the view's constructor.
        """
        view = KMeansWorkflowView(op=self, **kwargs)
        return view

    

[docs]
    def estimate(self, experiment):
        """
        Estimate the k-means model on ``experiment``.

        Copies ``xchannel`` / ``ychannel`` and ``xscale`` / ``yscale`` into
        the ``channels`` list and ``scale`` dict, then calls the parent
        class's ``estimate`` with this operation's ``subset``.

        Raises
        ------
        util.CytoflowOpError
            If ``xchannel`` or ``ychannel`` is not set.
        """
        # both channels are required; X is checked before Y
        required = (('xchannel', "Must set X channel"),
                    ('ychannel', "Must set Y channel"))
        for trait_name, message in required:
            if not getattr(self, trait_name):
                raise util.CytoflowOpError(trait_name, message)

        x, y = self.xchannel, self.ychannel
        self.channels = [x, y]
        self.scale = {x: self.xscale, y: self.yscale}

        super().estimate(experiment, subset=self.subset)

        

[docs]
    def apply(self, experiment):
        """
        Apply the estimated model to ``experiment`` via `KMeansOp.apply`.

        Raises
        ------
        util.CytoflowOpError
            If ``_kmeans`` is empty, i.e. nothing has been estimated yet.
        """
        if self._kmeans:
            return KMeansOp.apply(self, experiment)

        raise util.CytoflowOpError(None, 'Click "Estimate"!')

    

[docs]
    def clear_estimate(self):
        """
        Discard the estimate by resetting ``_kmeans`` and ``_scale`` to
        empty dicts.
        """
        # same order as before: _kmeans first, then _scale; each gets its
        # own fresh dict
        for estimated in ('_kmeans', '_scale'):
            setattr(self, estimated, {})

    

[docs]
    def get_notebook_code(self, idx):
        """
        Return the notebook source text that re-creates this operation.

        A plain `KMeansOp` is populated from this operation's copyable
        traits plus the ``channels`` / ``scale`` built from the x/y traits;
        its ``repr`` is embedded in the generated code.  ``idx`` numbers the
        generated ``op_`` / ``ex_`` variables, and the input experiment is
        ``ex_{idx - 1}``.
        """
        op = KMeansOp()
        op.copy_traits(self, op.copyable_trait_names())
        op.channels = [self.xchannel, self.ychannel]
        op.scale = {self.xchannel: self.xscale,
                    self.ychannel: self.yscale}

        template = """
        op_{idx} = {repr}
        
        op_{idx}.estimate(ex_{prev_idx}{subset})
        ex_{idx} = op_{idx}.apply(ex_{prev_idx})
        """

        op_repr = repr(op)

        # only emit the "subset" argument when a subset is actually set
        subset = self.subset
        if subset:
            subset_arg = ", subset = " + repr(subset)
        else:
            subset_arg = ""

        # the template is formatted first and dedented afterwards
        code = template.format(repr=op_repr,
                               idx=idx,
                               prev_idx=idx - 1,
                               subset=subset_arg)
        return dedent(code)


        
        

[docs]
@provides(IWorkflowView)
class KMeansWorkflowView(WorkflowByView):
    """
    Workflow view for a k-means operation.

    The subset, grouping, channel and scale traits are all delegated to the
    operation held in ``op``.
    """

    # the operation this view belongs to
    op = Instance(IWorkflowOperation, fixed = True)

    # all of these are read from (and written to) the operation
    subset = DelegatesTo('op')
    by = DelegatesTo('op')
    xchannel = DelegatesTo('op')
    xscale = DelegatesTo('op')
    ychannel = DelegatesTo('op')
    yscale = DelegatesTo('op')
    
    # a default ScatterplotPlotParams instance is created for each view
    plot_params = Instance(ScatterplotPlotParams, ())
    
    # identifiers for this view -- NOTE(review): presumably consumed by the
    # GUI / plugin machinery; confirm against IWorkflowView
    id = "cytoflowgui.op_plugins.kmeans"
    friendly_id = "KMeans" 
    
    name = Constant("KMeans")
    

[docs]
    def plot(self, experiment, **kwargs):
        """
        Plot ``experiment`` with a `KMeans2DView` built from this view's
        operation, channels and scales.

        Keyword arguments are forwarded to `KMeans2DView.plot`.
        """
        view = KMeans2DView(op=self.op,
                            xchannel=self.xchannel,
                            ychannel=self.ychannel,
                            xscale=self.xscale,
                            yscale=self.yscale)
        view.plot(experiment, **kwargs)

                     

[docs]
    def enum_plots(self, experiment):
        """
        Return the result of `KMeans2DView.enum_plots` for ``experiment``,
        using a `KMeans2DView` built from this view's operation, channels
        and scales.
        """
        view = KMeans2DView(op=self.op,
                            xchannel=self.xchannel,
                            ychannel=self.ychannel,
                            xscale=self.xscale,
                            yscale=self.yscale)
        return view.enum_plots(experiment)

            

[docs]
    def get_notebook_code(self, idx):
        """
        Return the notebook source text that re-creates this plot.

        A scratch `KMeans2DView` receives this view's copyable traits
        (except the channel and scale traits) and its ``subset``; the
        scratch view's traits become the arguments of ``default_view`` in
        the generated code.  ``idx`` numbers the ``op_`` / ``ex_`` variables.
        """
        view = KMeans2DView()
        trait_names = view.copyable_trait_names()

        # the channel / scale traits are not copied onto the scratch view
        # NOTE(review): presumably because default_view() takes them from
        # the operation -- confirm
        for omitted in ('xchannel', 'xscale', 'ychannel', 'yscale'):
            trait_names.remove(omitted)

        view.copy_traits(self, trait_names)
        view.subset = self.subset

        plot_params_str = traits_str(self.plot_params)
        view_traits = traits_str(view)

        # optional arguments are only emitted when they have a value
        if self.current_plot:
            plot_arg = ", plot_name = " + repr(self.current_plot)
        else:
            plot_arg = ""

        if plot_params_str:
            plot_params_arg = ", " + plot_params_str
        else:
            plot_params_arg = ""

        template = """
        op_{idx}.default_view({traits}).plot(ex_{idx}{plot}{plot_params})
        """

        # the template is formatted first and dedented afterwards
        code = template.format(traits=view_traits,
                               idx=idx,
                               plot=plot_arg,
                               plot_params=plot_params_arg)
        return dedent(code)


        
        
@camel_registry.dumper(KMeansWorkflowOp, 'kmeans', version = 1)
def _dump(op):
    """
    Serialize a `KMeansWorkflowOp` as a dict of its user-set parameters.

    The keys are trait names of `KMeansWorkflowOp`; the matching loader
    passes the dict straight back to the constructor as keyword arguments.
    The ``_kmeans`` estimate is not included.

    ``by`` is saved along with the other ``estimate`` parameters so that the
    grouping survives a save / load round trip.  Data saved without a ``by``
    key still loads, because the loader simply leaves the trait at its
    default.
    """
    return dict(name = op.name,
                xchannel = op.xchannel,
                ychannel = op.ychannel,
                xscale = op.xscale,
                yscale = op.yscale,
                num_clusters = op.num_clusters,
                by = op.by,
                subset_list = op.subset_list)
    
@camel_registry.loader('kmeans', version=1)
def _load(data, version):
    """
    Rebuild a `KMeansWorkflowOp` from a serialized ``data`` dict, whose
    entries are passed to the constructor as keyword arguments.

    ``version`` is accepted but not used.
    """
    op = KMeansWorkflowOp(**data)
    return op

@camel_registry.dumper(KMeansWorkflowView, 'kmeans-view', version=2)
def _dump_view(view):
    """
    Serialize a `KMeansWorkflowView` (version 2): its operation, plot
    parameters and currently selected plot.
    """
    return {
        'op': view.op,
        'plot_params': view.plot_params,
        'current_plot': view.current_plot,
    }
    
@camel_registry.dumper(KMeansWorkflowView, 'kmeans-view', version=1)
def _dump_view_v1(view):
    """
    Serialize a `KMeansWorkflowView` in the version 1 layout, which holds
    only the view's operation.
    """
    return {'op': view.op}

@camel_registry.loader('kmeans-view', version=any)
def _load_view(data, ver):
    """
    Rebuild a `KMeansWorkflowView` from a serialized ``data`` dict, whose
    entries are passed to the constructor as keyword arguments.

    Registered with ``version=any``; ``ver`` is accepted but not used.
    """
    view = KMeansWorkflowView(**data)
    return view