Source code for cellpy.utils.batch_tools.batch_plotters

import itertools
import logging
import sys
import warnings
from collections import defaultdict

import numpy as np
import pandas as pd

from cellpy import prms
from cellpy.exceptions import UnderDefined
from cellpy.parameters.internal_settings import get_headers_journal, get_headers_summary
from cellpy.utils.batch_tools.batch_core import BasePlotter
from cellpy.utils.batch_tools.batch_experiments import CyclingExperiment

# TODO: add palette to prms.Batch

try:
    import bokeh

except ImportError:
    prms.Batch.backend = "matplotlib"
    logging.debug("could not import bokeh -> using matplotlib instead")

hdr_journal = get_headers_journal()
hdr_summary = get_headers_summary()


# print(prms.Batch.backend)


[docs]def create_legend(info, c, option="clean", use_index=False): """creating more informative legends""" logging.debug(" - creating legends") mass, loading, label = info.loc[ c, [hdr_journal["mass"], hdr_journal["loading"], hdr_journal["label"]] ] if use_index or not label: label = c.split("_") label = "_".join(label[1:]) if option == "clean": logging.debug(f"label: {label}") return label if option == "mass": label = f"{label} ({mass:.2f} mg)" elif option == "loading": label = f"{label} ({loading:.2f} mg/cm2)" elif option == "all": label = f"{label} ({mass:.2f} mg) ({loading:.2f} mg/cm2)" logging.debug(f"advanced label: {label}") return label
[docs]def look_up_group(info, c): logging.debug(" - looking up groups") g, sg = info.loc[c, [hdr_journal["group"], hdr_journal["sub_group"]]] return int(g), int(sg)
[docs]def create_plot_option_dicts( info, marker_types=None, colors=None, line_dash=None, size=None, palette=None ): """Create two dictionaries with plot-options. The first iterates colors (based on group-number), the second iterates through marker types. Returns: group_styles (dict), sub_group_styles (dict) """ logging.debug(" - creating plot-options-dict (for bokeh)") if palette is None: try: # palette = bokeh.palettes.brewer['YlGnBu'] palette = bokeh.palettes.d3["Category20"] # palette = bokeh.palettes.brewer[prms.Batch.bokeh_palette'] except (NameError, AttributeError) as e: logging.info(f"could not create the palette {e}") palette = { 1: ["k"], 3: ["k", "r"], 4: ["k", "r", "b"], 5: ["k", "r", "b", "g"], 6: ["k", "r", "b", "g", "c"], 7: ["k", "r", "b", "g", "c", "m"], 8: ["k", "r", "b", "g", "c", "m", "y"], } max_palette_row = max(palette.keys()) if marker_types is None: marker_types = [ "circle", "square", "triangle", "inverted_triangle", "diamond", "asterisk", "cross", ] if line_dash is None: line_dash = [0, 0] if size is None: size = 10 groups = info[hdr_journal.group].unique() number_of_groups = len(groups) if colors is None: if number_of_groups < 4: colors = palette[3] else: colors = palette[min(max_palette_row, number_of_groups)] sub_groups = info[hdr_journal.sub_group].unique() marker_it = itertools.cycle(marker_types) colors_it = itertools.cycle(colors) group_styles = dict() sub_group_styles = dict() for j in groups: color = next(colors_it) marker_options = {"line_color": color, "fill_color": color} line_options = {"line_color": color} group_styles[j] = {"marker": marker_options, "line": line_options} for j in sub_groups: marker_type = next(marker_it) marker_options = {"marker": marker_type, "size": size} line_options = {"line_dash": line_dash} sub_group_styles[j] = {"marker": marker_options, "line": line_options} return group_styles, sub_group_styles
[docs]def create_summary_plot_bokeh( data, info, group_styles, sub_group_styles, label=None, title="Capacity", x_axis_label="Cycle number", y_axis_label="Capacity (mAh/g)", width=900, height=400, legend_option="clean", legend_location="bottom_right", x_range=None, y_range=None, tools="hover", ): # TODO: include max cycle (bokeh struggles when there is to much to plot) # could also consider interpolating # or defaulting to datashader for large files. warnings.warn( "This utility function will be seriously removed and replaced with a plotly version soon.", category=DeprecationWarning, ) logging.debug(f" - creating summary (bokeh) plot for {label}") discharge_capacity = None if isinstance(data, (list, tuple)): charge_capacity = data[0] if len(data) == 2: discharge_capacity = data[1] else: charge_capacity = data p = bokeh.plotting.figure( title=title, width=width, height=height, # tools = tools, x_range=x_range, y_range=y_range, x_axis_label=x_axis_label, y_axis_label=y_axis_label, ) sub_cols_charge = None sub_cols_discharge = None legend_collection = [] if isinstance(charge_capacity.columns, pd.MultiIndex): cols = charge_capacity.columns.get_level_values(1) sub_cols_charge = charge_capacity.columns.get_level_values(0).unique() charge_capacity.columns = [ f"{col[0]}_{col[1]}" for col in charge_capacity.columns.values ] if discharge_capacity is not None: sub_cols_discharge = discharge_capacity.columns.get_level_values(0).unique() discharge_capacity.columns = [ f"{col[0]}_{col[1]}" for col in discharge_capacity.columns.values ] else: cols = charge_capacity.columns logging.debug("iterate cols") for cc in cols: g, sg = look_up_group(info, cc) legend_items = [] l = create_legend(info, cc, option=legend_option) group_props = group_styles[g] sub_group_props = sub_group_styles[sg] logging.debug(f"subgroups {sub_group_props}") if sub_cols_charge is not None: c = f"{sub_cols_charge[0]}_{cc}" r = f"{sub_cols_charge[1]}_{cc}" if c not in charge_capacity.columns: charge_capacity[c] = np.nan if r not in charge_capacity.columns: charge_capacity[r] = np.nan selector = [c, r] charge_capacity_sub = charge_capacity.loc[:, selector] charge_capacity_sub.columns = [c, "rate"] charge_source = bokeh.models.ColumnDataSource(charge_capacity_sub) else: c = cc if c not in charge_capacity.columns: charge_capacity[c] = np.nan charge_capacity_sub = charge_capacity.loc[:, [c]] charge_source = bokeh.models.ColumnDataSource(charge_capacity_sub) logging.debug(f"starting creating scatter") ch_m = p.scatter( source=charge_source, x=hdr_summary.cycle_index, y=c, # **legend_option_dict, # Remark! cannot use the same legend name as # column name (defaults to a lookup) **group_props["marker"], # color **sub_group_props["marker"], # marker ) logging.debug(f"starting creating line") ch_l = p.line( source=charge_source, x=hdr_summary.cycle_index, y=c, **group_props["line"], **sub_group_props["line"], ) legend_items.extend([ch_m, ch_l]) logging.debug(f"fixing discharge cap") if discharge_capacity is not None: # creating a local copy so that I can do local changes group_props_marker_charge = group_props["marker"].copy() group_props_marker_charge["fill_color"] = None if sub_cols_discharge is not None: c = f"{sub_cols_discharge[0]}_{cc}" r = f"{sub_cols_discharge[1]}_{cc}" if c not in charge_capacity.columns: charge_capacity[c] = np.nan if r not in charge_capacity.columns: charge_capacity[r] = np.nan discharge_capacity_sub = discharge_capacity.loc[:, [c, r]] discharge_capacity_sub.columns = [c, "rate"] discharge_source = bokeh.models.ColumnDataSource(discharge_capacity_sub) else: c = cc if c not in charge_capacity.columns: charge_capacity[c] = np.nan discharge_capacity_sub = discharge_capacity.loc[:, [c]] discharge_source = bokeh.models.ColumnDataSource(discharge_capacity_sub) dch_m = p.scatter( source=discharge_source, x=hdr_summary.cycle_index, y=c, **group_props_marker_charge, **sub_group_props["marker"], ) dch_l = p.line( source=discharge_source, x=hdr_summary.cycle_index, y=c, **group_props["line"], **sub_group_props["line"], ) legend_items.extend([dch_m, dch_l]) legend_collection.append((l, legend_items)) logging.debug("exiting summary plotter") return p, legend_collection
[docs]def plot_cycle_life_summary_bokeh( info, summaries, width=900, height=800, height_fractions=None, legend_option="all", add_rate=True, **kwargs, ): # TODO: This function should be refactored! if height_fractions is None: height_fractions = [0.3, 0.4, 0.3] logging.debug(f" * stacking and plotting") logging.debug(f" backend: {prms.Batch.backend}") logging.debug(f" received kwargs: {kwargs}") idx = pd.IndexSlice all_legend_items = [] warnings.warn( "This utility function will be removed shortly", category=DeprecationWarning ) if add_rate: try: discharge_capacity = summaries.loc[ :, idx[ [ hdr_summary["discharge_capacity_gravimetric"], hdr_summary["discharge_c_rate"], ], :, ], ] except AttributeError: warnings.warn( "No discharge rate columns available - consider re-creating summary!" ) discharge_capacity = summaries[ hdr_summary["discharge_capacity_gravimetric"] ] try: charge_capacity = summaries.loc[ :, idx[ [ hdr_summary["charge_capacity_gravimetric"], hdr_summary["charge_c_rate"], ], :, ], ] except AttributeError: warnings.warn( "No charge rate columns available - consider re-creating summary!" ) charge_capacity = summaries[hdr_summary["charge_capacity_gravimetric"]] try: coulombic_efficiency = summaries.loc[ :, idx[[hdr_summary.coulombic_efficiency, hdr_summary.charge_c_rate], :] ] except AttributeError: warnings.warn( "No charge rate columns available - consider re-creating summary!" ) coulombic_efficiency = summaries.coulombic_efficiency if hdr_summary.ir_charge in summaries.columns: try: ir_charge = summaries.loc[ :, idx[[hdr_summary.ir_charge, hdr_summary.charge_c_rate], :] ] except AttributeError: warnings.warn( "No charge rate columns available - consider re-creating summary!" ) ir_charge = summaries.ir_charge else: ir_charge = pd.DataFrame() else: discharge_capacity = summaries[hdr_summary["discharge_capacity_gravimetric"]] charge_capacity = summaries[hdr_summary["charge_capacity_gravimetric"]] coulombic_efficiency = summaries[hdr_summary["coulombic_efficiency"]] ir_charge = summaries[hdr_summary["ir_charge"]] h_eff = int(height_fractions[0] * height) h_cap = int(height_fractions[1] * height) h_ir = int(height_fractions[2] * height) group_styles, sub_group_styles = create_plot_option_dicts(info) p_eff, legends_eff = create_summary_plot_bokeh( coulombic_efficiency, info, group_styles, sub_group_styles, label="c.e.", legend_option=legend_option, title=None, x_axis_label=None, y_axis_label="Coulombic efficiency (%)", width=width, height=h_eff, ) all_legend_items.extend(legends_eff) if not ir_charge.empty: cap_x_axis = None else: cap_x_axis = "Cycle number" p_cap, legends_cap = create_summary_plot_bokeh( (charge_capacity, discharge_capacity), info, group_styles, sub_group_styles, legend_option=legend_option, label="charge and discharge cap.", title=None, x_axis_label=cap_x_axis, height=h_cap, width=width, x_range=p_eff.x_range, ) all_legend_items.extend(legends_cap) if not ir_charge.empty: p_ir, legends_ir = create_summary_plot_bokeh( ir_charge, info, group_styles, sub_group_styles, label="ir charge", legend_option=legend_option, title=None, x_axis_label="Cycle number", y_axis_label="IR Charge (Ohm)", width=width, height=h_ir, x_range=p_eff.x_range, ) all_legend_items.extend(legends_ir) p_eff.y_range.start, p_eff.y_range.end = 20, 120 p_eff.xaxis.visible = False if not ir_charge.empty: p_cap.xaxis.visible = False tooltips = [("cycle", f"@{hdr_summary.cycle_index}"), ("value", "$y{0.}")] if add_rate: tooltips.append(("rate", "@rate{0.000}")) hover = bokeh.models.HoverTool(tooltips=tooltips) p_eff.add_tools(hover) p_cap.add_tools(hover) if not ir_charge.empty: p_ir.add_tools(hover) renderer_list = p_eff.renderers + p_cap.renderers if not ir_charge.empty: renderer_list += p_ir.renderers legend_items_dict = defaultdict(list) for label, r in all_legend_items: legend_items_dict[label].extend(r) legend_items = [] renderer_list = [] for legend in legend_items_dict: legend_items.append( bokeh.models.LegendItem(label=legend, renderers=legend_items_dict[legend]) ) renderer_list.extend(legend_items_dict[legend]) legend_title = "Legends" dummy_figure_for_legend = bokeh.plotting.figure( plot_width=300, plot_height=height, outline_line_alpha=0, toolbar_location=None, width_policy="min", min_width=300, title=legend_title, ) # set the components of the figure invisible for fig_component in [ dummy_figure_for_legend.grid[0], dummy_figure_for_legend.ygrid[0], dummy_figure_for_legend.xaxis[0], dummy_figure_for_legend.yaxis[0], ]: fig_component.visible = False dummy_figure_for_legend.renderers += renderer_list # set the figure range outside the range of all # glyphs (assuming that negative cycle numbers never happen) dummy_figure_for_legend.x_range.start, dummy_figure_for_legend.x_range.end = ( -10, -9, ) dummy_figure_for_legend.add_layout( bokeh.models.Legend( click_policy="hide", location="top_left", border_line_alpha=0, items=legend_items, ) ) dummy_figure_for_legend.title.align = "center" grid_layout = [p_eff, p_cap] if not ir_charge.empty: grid_layout.append(p_ir) fig_grid = bokeh.layouts.gridplot(grid_layout, ncols=1, sizing_mode="stretch_width") info_text = "(filled:charge) (open:discharge)" if not ir_charge.empty: p_ir.add_layout(bokeh.models.Title(text=info_text, align="right"), "below") else: p_cap.add_layout(bokeh.models.Title(text=info_text, align="right"), "below") final_figure = bokeh.layouts.row( children=[fig_grid, dummy_figure_for_legend], sizing_mode="stretch_width" ) return bokeh.plotting.show(final_figure)
[docs]def plot_cycle_life_summary_matplotlib( info, summaries, width=900, height=800, height_fractions=None, legend_option="all", **kwargs, ): warnings.warn( "This utility function will be seriously changed soon and possibly removed", category=DeprecationWarning, ) import matplotlib.pyplot as plt logging.debug(f" * stacking and plotting") logging.debug(f" backend: {prms.Batch.backend}") logging.debug(f" received kwargs: {kwargs}") # Not used (yet?) - requires a more advanced generation of sub-plots if height_fractions is None: height_fractions = [0.3, 0.4, 0.3] # print(" running matplotlib plotter ".center(80,"=")) # convert from bokeh to matplotlib - figsize - inch-ish width /= 80 height /= 120 discharge_capacity = summaries[hdr_summary["discharge_capacity_gravimetric"]] charge_capacity = summaries[hdr_summary["charge_capacity_gravimetric"]] coulombic_efficiency = summaries.coulombic_efficiency try: ir_charge = summaries.ir_charge except AttributeError: logging.debug("the data is missing ir charge") ir_charge = None plt.rcParams["figure.figsize"] = (10, 10) marker_types = [ "o", "s", "v", "^", "<", ">", "8", "p", "P", "*", "h", "H", "+", "x", "X", "D", "d", ".", ",", ] marker_size = kwargs.pop("marker_size", None) group_styles, sub_group_styles = create_plot_option_dicts( info, marker_types=marker_types, size=marker_size ) if ir_charge is None: canvas, (ax_ce, ax_cap) = plt.subplots( 2, 1, figsize=(width, height), sharex=True, gridspec_kw={"height_ratios": height_fractions[:-1]}, ) else: canvas, (ax_ce, ax_cap, ax_ir) = plt.subplots( 3, 1, figsize=(width, height), sharex=True, gridspec_kw={"height_ratios": height_fractions}, ) for label in charge_capacity.columns.get_level_values(0): name = create_legend(info, label, option=legend_option) g, sg = look_up_group(info, label) group_style = group_styles[g] sub_group_style = sub_group_styles[sg] marker = sub_group_style["marker"] line = group_style["line"] c = line["line_color"] m = marker["marker"] f = "white" try: ax_cap.plot( charge_capacity[label], label=name, color=c, marker=m, markerfacecolor=c ) except Exception as e: logging.debug(f"Could not plot charge capacity for {label} ({e})") try: ax_cap.plot( discharge_capacity[label], label=name, color=c, marker=m, markerfacecolor=f, ) except Exception as e: logging.debug(f"Could not plot discharge capacity for {label} ({e})") ax_ce.plot( coulombic_efficiency[label], label=name, color=c, marker=m, markerfacecolor=c, ) if ir_charge is not None: try: ax_ir.plot( ir_charge[label], color=c, label=name, marker=m, markerfacecolor=c ) except Exception as e: logging.debug(f"Could not plot IR for {label} ({e})") ax_all = [ax_cap, ax_ce] ax_ce.set_ylabel("Coulombic\nEfficiency (%)") ax_ce.set_ylim((0, 110)) ax_cap.set_ylabel("Capacity\n(mAh/g)") if ir_charge is not None: ax_ir.set_ylabel("IR\n(charge)") ax_ir.set_xlabel("Cycle") ax_all.append(ax_ir) else: ax_cap.set_xlabel("Cycle") for ax in ax_all: box = ax.get_position() ax.set_position([box.x0, box.y0, box.width * 0.6, box.height]) # Put a legend to the right of the current axis legend = ax_cap.legend(loc="center left", bbox_to_anchor=(1, 0.5)) legend.get_frame().set_facecolor("none") legend.get_frame().set_linewidth(0.0) return canvas
[docs]def summary_plotting_engine(**kwargs): """creates plots of summary data.""" warnings.warn( "This utility function will be seriously changed soon and possibly removed", category=DeprecationWarning, ) logging.debug(f"Using {prms.Batch.backend} for plotting") experiments = kwargs.pop("experiments") farms = kwargs.pop("farms") barn = None logging.debug(" - summary_plot_engine") farms = _preparing_data_and_plotting(experiments=experiments, farms=farms, **kwargs) return farms, barn
def _plotting_data(pages, summaries, width, height, height_fractions, **kwargs): # sub-sub-engine canvas = None if prms.Batch.backend == "bokeh": canvas = plot_cycle_life_summary_bokeh( pages, summaries, width, height, height_fractions, **kwargs ) elif prms.Batch.backend == "matplotlib": logging.info("[obs! experimental]") canvas = plot_cycle_life_summary_matplotlib( pages, summaries, width, height, height_fractions, **kwargs ) else: logging.info(f"the {prms.Batch.backend} " f"back-end is not implemented yet.") return canvas def _preparing_data_and_plotting(**kwargs): # sub-engine logging.debug(" - _preparing_data_and_plotting") experiments = kwargs.pop("experiments") farms = kwargs.pop("farms") width = kwargs.pop("width", prms.Batch.summary_plot_width) height = kwargs.pop("height", prms.Batch.summary_plot_height) height_fractions = kwargs.pop( "height_fractions", prms.Batch.summary_plot_height_fractions ) for experiment in experiments: if not isinstance(experiment, CyclingExperiment): logging.info( "No! This engine is only really good at processing CyclingExperiments" ) logging.info(experiment) else: pages = experiment.journal.pages try: keys = [df.name for df in experiment.memory_dumped["summary_engine"]] summaries = pd.concat( experiment.memory_dumped["summary_engine"], keys=keys, axis=1 ) canvas = _plotting_data( pages, summaries, width, height, height_fractions, **kwargs ) farms.append(canvas) except KeyError: logging.info("could not parse the summaries") logging.info(" - might be new a bug?") logging.info( " - might be a known bug related to dropping cells (b.drop)" ) logging.info(" - maybe try reloading the data helps?") return farms
[docs]def exporting_plots(**kwargs): # dumper experiments = kwargs["experiments"] farms = kwargs["farms"] barn = kwargs["barn"] engine = kwargs["engine"] return None
[docs]class CyclingSummaryPlotter(BasePlotter): def __init__(self, *args, reset_farms=True): """ Attributes (inherited): experiments: list of experiments. farms: list of farms (containing pandas DataFrames or figs). barn (str): identifier for where to place the output-files. reset_farms (bool): empty the farms before running the engine. """ super().__init__(*args) self.engines = list() self.dumpers = list() self.reset_farms = reset_farms self._use_dir = None self.current_engine = None self._assign_engine(summary_plotting_engine) self._assign_dumper(exporting_plots) @property def columns(self): if len(self.experiments > 0): return self.experiments[0].summaries.columns.get_level_values(0) def _assign_engine(self, engine): self.engines.append(engine) def _assign_dumper(self, dumper): self.dumpers.append(dumper)
[docs] def run_engine(self, engine, **kwargs): """run engine (once pr. experiment). Args: engine: engine to run (function or method). The method issues the engine command (with experiments and farms as input) that returns an updated farms as well as the barn and assigns them both to self. The farms attribute is a list of farms, i.e. [farm1, farm2, ...], where each farm contains pandas DataFrames. The barns attribute is a pre-defined string used for picking what folder(s) the file(s) should be exported to. For example, if barn equals "batch_dir", the the file(s) will be saved to the experiments batch directory. The engine(s) is given self.experiments and self.farms as input and returns farms to self.farms and barn to self.barn. Thus, one could in principle modify self.experiments within the engine without explicitly 'notifying' the poor soul who is writing a batch routine using that engine. However, it is strongly advised not to do such things. And if you, as engine designer, really need to, then at least notify it through a debug (logger) statement. """ logging.debug("start engine::") self.current_engine = engine if self.reset_farms: self.farms = [] self.farms, self.barn = engine( experiments=self.experiments, farms=self.farms, **kwargs ) logging.debug("::engine ended")
[docs] def run_dumper(self, dumper): """run dumber (once pr. engine) Args: dumper: dumper to run (function or method). The dumper takes the attributes experiments, farms, and barn as input. It does not return anything. But can, if the dumper designer feels in a bad and nasty mood, modify the input objects (for example experiments). """ logging.debug("start dumper::") dumper( experiments=self.experiments, farms=self.farms, barn=self.barn, engine=self.current_engine, ) logging.debug("::dumper ended")
# def do(self): # if not self.experiments: # raise UnderDefined("cannot run until " "you have assigned an experiment") # # for engine in self.engines: # self.empty_the_farms() # logging.debug(f"running - {str(engine)}") # self.run_engine(engine) # # for dumper in self.dumpers: # logging.debug(f"exporting - {str(dumper)}") # self.run_dumper(dumper)
[docs]class EISPlotter(BasePlotter): def __init__(self): super().__init__()
[docs] def do(self): warnings.warn("not implemented yet")
if __name__ == "__main__": print("batch_plotters".center(80, "=")) csp = CyclingSummaryPlotter() eisp = EISPlotter() print("\n --> OK")