#!/usr/bin/env python3.8
# coding: latin-1
# (c) Massachusetts Institute of Technology 2015-2018
# (c) Brian Teague 2018-2022
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
"""
cytoflow.views.parallel_coords
------------------------------
A parallel-coordinates plot.
`ParallelCoordinatesView` -- the `IView` class that makes the plot.
"""
from traits.api import provides, Constant
import matplotlib.pyplot as plt
import matplotlib.collections
import pandas as pd
import numpy as np
import cytoflow.utility as util
from .i_view import IView
from .base_views import BaseNDView
[docs]@provides(IView)
class ParallelCoordinatesView(BaseNDView):
"""
Plots a parallel coordinates plot. PC plots are good for multivariate
data; each vertical line represents one attribute, and one set of
connected line segments represents one data point.
Attributes
----------
Examples
--------
Make a little data set.
.. plot::
:context: close-figs
>>> import cytoflow as flow
>>> import_op = flow.ImportOp()
>>> import_op.tubes = [flow.Tube(file = "Plate01/RFP_Well_A3.fcs",
... conditions = {'Dox' : 10.0}),
... flow.Tube(file = "Plate01/CFP_Well_A4.fcs",
... conditions = {'Dox' : 1.0})]
>>> import_op.conditions = {'Dox' : 'float'}
>>> ex = import_op.apply()
Plot the PC plot.
.. plot::
:context: close-figs
>>> flow.ParallelCoordinatesView(channels = ['B1-A', 'V2-A', 'Y2-A', 'FSC-A'],
... scale = {'Y2-A' : 'log',
... 'V2-A' : 'log',
... 'B1-A' : 'log',
... 'FSC-A' : 'log'},
... huefacet = 'Dox').plot(ex)
"""
id = Constant('edu.mit.synbio.cytoflow.view.parallel_coords')
friend_id = Constant("Parallel Coordinates Plot")
[docs] def plot(self, experiment, **kwargs):
"""
Plot a faceted parallel coordinates plot
Parameters
----------
alpha : float (default = 0.02)
The alpha blending value, between 0 (transparent) and 1 (opaque).
axvlines_kwds : dict
A dictionary of parameters to pass to `ax.axvline <https://matplotlib.org/api/_as_gen/matplotlib.axes.Axes.axvline.html>`_
Notes
-----
This uses a low-level API for speed; there are far fewer visual options
that with other views.
"""
if len(self.channels) < 3:
raise util.CytoflowViewError('channels',
"Must have at least 3 channels")
super().plot(experiment, **kwargs)
# clean up the plot
for ax in plt.gcf().get_axes():
ax.set_xlabel("")
ax.set_ylabel("")
ax.get_yaxis().set_ticks([])
def _grid_plot(self, experiment, grid, **kwargs):
# xlim and ylim, xscale and yscale are the limits and scale of the
# plane onto which we are projecting. the kwargs 'scale' and 'lim'
# are the data scale and limits, respectively
scale = kwargs.pop('scale')
lim = kwargs.pop('lim')
# TODO - some way to optimize attribute order
# TODO - allow changing attribute spacing
# memo to track if we've put annotations on an axes yet
ax_annotations = {}
grid.map(_parallel_coords_plot,
*self.channels,
ax_annotations = ax_annotations,
scale = scale,
lim = lim,
**kwargs)
return {}
def _update_legend(self, legend):
for lh in legend.legendHandles:
lh.set_alpha(0.5)
lh.set_linewidth(3)
def _parallel_coords_plot(*channels, ax_annotations, scale, lim, **kwargs):
color = kwargs.pop('color')
alpha = kwargs.pop('alpha', 0.02)
aa = kwargs.pop('antialiased', True)
color = tuple(list(color) + [alpha])
label = kwargs.pop('label', None)
df = pd.DataFrame()
for c in channels:
vmin = lim[c.name][0]
vmax = lim[c.name][1]
c_scaled = pd.Series(data = scale[c.name].norm(vmin = vmin, vmax = vmax)(c.values),
index = c.index,
name = c.name)
c_scaled[(c < vmin) | (c > vmax)] = np.nan
df[c.name] = c_scaled
df.dropna(axis = 0, how = 'any', inplace = True)
# adapted from pandas.plotting._misc
axvlines_kwds = kwargs.pop('axvlines_kwds', {'linewidth' : 1, 'color' : 'black'})
ax = plt.gca()
# we're creating a LineCollection manually because it's much much much
# faster than the higher-level plotting routines
out = pd.Series()
for i in range(len(df.columns) - 1):
new_series = df.apply( lambda x: [(i, x[i]), (i + 1, x[i + 1])], axis = 1)
out = out.append(new_series)
lc = matplotlib.collections.LineCollection(out.values, colors = color, antialiaseds = aa)
lc.set_label(label)
ax.add_collection(lc)
# have we already annotated these axes?
if ax in ax_annotations:
return
ax_annotations[ax] = True
x = np.arange(len(df.columns))
for i in x:
ax.axvline(i, **axvlines_kwds)
ax.set_xticks(x)
ax.set_xticklabels(df.columns)
ax.set_xlim(x[0], x[-1])
ax.grid()
util.expand_class_attributes(ParallelCoordinatesView)
util.expand_method_parameters(ParallelCoordinatesView, ParallelCoordinatesView.plot)