import inspect
from functools import singledispatch
from pathlib import Path
from pandas import DataFrame, Series
from mols2grid.molgrid import MolGrid
_SIGNATURE = {
method: dict(inspect.signature(getattr(MolGrid, method)).parameters.items())
for method in ["render", "to_interactive", "to_static", "display"]
}
for method in ["render", "to_interactive", "to_static", "display"]:
_SIGNATURE[method].pop("self")
if method in {"render", "display"}:
_SIGNATURE[method].pop("kwargs")
def _prepare_kwargs(kwargs, kind):
"""Separate kwargs for the init and render methods of MolGrid"""
template = kwargs.pop("template", _SIGNATURE["render"]["template"].default)
render_kwargs = {
param: kwargs.pop(param, sig.default)
for param, sig in _SIGNATURE[f"to_{template}"].items()
}
if kind == "display":
render_kwargs.update(
{
param: kwargs.pop(param, sig.default)
for param, sig in _SIGNATURE["display"].items()
}
)
return template, kwargs, render_kwargs
[docs]@singledispatch
def display(arg, **kwargs): # noqa: ARG001
"""Display molecules on an interactive grid.
Parameters: Data
----------------
arg : pandas.DataFrame, SDF file or list of molecules
The input containing your molecules.
smiles_col : str or None, default="SMILES"
If a pandas dataframe is used, name of the column with SMILES.
mol_col : str or None, default=None
If a pandas dataframe is used, name of the column with RDKit molecules.
If available, coordinates and atom/bonds annotations from this will be
used for depiction.
Parameters: Display
-------------------
template : str, default="interactive"
Either ``"interactive"`` or ``"static"``. See ``render()`` for more details.
size : tuple, default=(130, 90)
The size of the drawing canvas. The cell minimum width is set to the
width of the image, so if the cell padding is increased, the image will
be displayed smaller.
useSVG : bool, default=True
Use SVG images instead of PNG.
prerender : bool, default=False
Prerender images for the entire dataset, or generate them on-the-fly.
Prerendering is slow and memory-hungry, but required when ``template="static"``
or ``useSVG=False``.
subset: list or None, default=None
Columns to be displayed in each cell of the grid. Each column's
value will be displayed from top to bottom in the order provided.
The ``"img"`` and ``"mols2grid-id"`` columns are displayed by default,
however you can still add the ``"img"`` column if you wish to change
the display order.
tooltip : list, None or False, default=None
Columns to be displayed inside the tooltip. When no subset is set,
all columns will be listed in the tooltip by default. Use ``False``
to hide the tooltip.
tooltip_fmt : str, default="<strong>{key}</strong>: {value}"
Format string of each key/value pair in the tooltip.
tooltip_trigger : str, default="focus"
Only available for the "static" template.
Sequence of triggers for the tooltip: ``click``, ``hover`` or ``focus``
tooltip_placement : str, default="auto"
Position of the tooltip: ``auto``, ``top``, ``bottom``, ``left`` or
``right``
transform : dict or None, default=None
Functions applied to specific items in all cells. The dict must follow
a ``key: function`` structure where the key must correspond to one of
the columns in ``subset`` or ``tooltip``. The function takes the item's
value as input and transforms it, for example::
transform={
"Solubility": lambda x: f"{x:.2f}",
"Melting point": lambda x: f"MP: {5/9*(x-32):.1f}°C"
}
These transformations only affect columns in ``subset`` and
``tooltip``, and do not interfere with ``style``.
sort_by : str or None, default=None
Sort the grid according to the following field (which must be
present in ``subset`` or ``tooltip``).
truncate: bool, default=True/False
Whether to truncate the text in each cell if it's too long.
Defaults to ``True`` for interactive grids, ``False`` for static grid.
n_items_per_page, default=24
Only available for the "interactive" template.
Number of items to display per page. A multiple of 12 is recommended
for optimal display.
n_cols : int, default=5
Only available for the "static" template.
Number of columns in the table.
selection : bool, default=True
Only available for the "interactive" template.
Enables the selection of molecules and displays a checkbox at the
top of each cell. In the context of a Jupyter Notebook, this gives
you access to your selection (index and SMILES) through
:func:`mols2grid.get_selection()` or :meth:`MolGrid.get_selection()`.
In all cases, you can export your selection by clicking on the triple-dot menu.
cache_selection : bool, default=False
Only available for the "interactive" template.
Restores the selection from a previous grid with the same name.
use_iframe : bool, default=False
Whether to use an iframe to display the grid. When the grid is displayed
inside a Jupyter Notebook or JupyterLab, this will default to ``True``.
iframe_width : str, default="100%
Width of the iframe
iframe_height : int or None, default=None
Height of the frame. When set to ``None``, the height is set dynamically
based on the content.
Parameters: Mols
----------------
removeHs : bool, default=False
Remove hydrogen atoms from the drawings.
use_coords : bool, default=False
Use the coordinates of the molecules (only relevant when an SDF file, a
list of molecules or a DataFrame of RDKit molecules were used as input.)
coordGen : bool, default=True
Use the CoordGen library instead of the RDKit one to depict the
molecules in 2D.
MolDrawOptions : rdkit.Chem.Draw.rdMolDraw2D.MolDrawOptions or None, default=None
Drawing options. Useful for making highly customized drawings.
substruct_highlight : bool or None, default=None
Highlight substructure when using the SMARTS search. Active by default
when ``prerender=False``.
single_highlight : bool, default=False
Highlight only the first match of the substructure query.
Parameters: CSS
---------------
border : str, default="1px solid #cccccc"
Styling of the border around each cell.
gap : int, default=0
Size in pixels of the gap between cells.
pad : int, default=10
Size in pixels of the cell padding.
fontsize : str, default="12px"
Font size of the text displayed in each cell.
fontfamily : str, default="'DejaVu', sans-serif"
Font used for the text in each cell.
textalign : str, default="center"
Alignment of the text in each cell.
background_color : str, default="white"
Only available for the "interactive" template.
Background color of a cell.
hover_color : str, default="rgba(0,0,0,0.05)"
Only available for the "interactive" template.
Background color when hovering a cell
custom_css : str or None, default=None
Custom CSS properties applied to the generated HTML. Please note that
the CSS will apply to the entire page if no iframe is used (see
``use_iframe`` for more details).
style : dict or None, default=None
CSS styling applied to each item in a cell. The dict must follow a
``key: function`` structure where the key must correspond to one of the
columns in ``subset`` or ``tooltip``. The function takes the item's
value as input, and outputs a valid CSS styling. For example, if you
want to color the text corresponding to the "Solubility" column in your
dataframe::
style={"Solubility": lambda x: "color: red" if x < -5 else ""}
You can also style a whole cell using the ``__all__`` key, the
corresponding function then has access to all values for each cell::
style={"__all__": lambda x: "color: red" if x["Solubility"] < -5 else ""}
Parameters: Customization
-------------------------
name : str, default="default"
Name of the grid. Used when retrieving selections from multiple grids
at the same time
rename : dict or None, default=None
Rename the properties in the final document.
custom_header : str or None, default=None
Custom libraries to be loaded in the header of the document.
callback : str, callable or None, default=None
Only available for the "interactive" template.
JavaScript or Python callback to be executed when clicking on an image.
A dictionnary containing the data for the full cell is directly available
as ``data`` in JS. For Python, the callback function must have ``data``
as the first argument to the function. All the values in the ``data`` dict
are parsed as strings, except "mols2grid-id" which is always an integer.
Note that fields containing spaces in their name will be replaced by
hyphens, i.e. "mol weight" becomes available as ``data["mol-weight"]``.
Returns
-------
view : IPython.core.display.HTML
Notes
-----
You can also directly use RDKit's
:class:`~rdkit.Chem.Draw.rdMolDraw2D.MolDrawOptions` parameters as arguments.
Additionally, ``atomColourPalette`` is available to customize the atom
palette if you're not prerendering image (``prerender=False``).
.. versionadded:: 0.1.0
Added ``sort_by``, ``custom_css``, ``custom_header`` and ``callback``
arguments. Added the ability to style an entire cell with
``style={"__all__": <function>}``.
.. versionadded:: 0.2.0
Added ``substruct_highlight`` argument.
.. versionchanged:: 0.2.2
If both ``subset`` and ``tooltip`` are ``None``, the index and image
will be directly displayed on the grid while the remaining fields will
be in the tooltip.
.. versionchanged:: 1.0.0
``callback`` can now be a *lambda* function. If ``prerender=True``,
substructure highlighting will be automatically disabled if it wasn't
explicitely set to ``True`` instead of raising an error.
"""
raise TypeError(f"No display method registered for type {type(arg)!r}")
@display.register(DataFrame)
@display.register(dict)
def _(df, **kwargs):
template, kwargs, render_kwargs = _prepare_kwargs(kwargs, "display")
return MolGrid(df, **kwargs).display(template=template, **render_kwargs)
@display.register(str)
@display.register(Path)
def _(sdf, **kwargs):
template, kwargs, render_kwargs = _prepare_kwargs(kwargs, "display")
return MolGrid.from_sdf(sdf, **kwargs).display(template=template, **render_kwargs)
@display.register(Series)
@display.register(list)
@display.register(tuple)
def _(mols, **kwargs):
template, kwargs, render_kwargs = _prepare_kwargs(kwargs, "display")
return MolGrid.from_mols(mols, **kwargs).display(template=template, **render_kwargs)
[docs]@singledispatch
def save(arg, **kwargs): # noqa: ARG001
"""Generate an interactive grid of molecules and save it.
Parameters
----------
arg : pandas.DataFrame, SDF file or list of molecules
The input containing your molecules.
output : str
Name and path of the output document.
Notes
-----
See :func:`display` for the full list of arguments.
"""
raise TypeError(f"No save method registered for type {type(arg)!r}")
@save.register(DataFrame)
def _(df, **kwargs):
template, kwargs, render_kwargs = _prepare_kwargs(kwargs, "save")
output = kwargs.pop("output")
return MolGrid(df, **kwargs).save(output, template=template, **render_kwargs)
@save.register(str)
@save.register(Path)
def _(sdf, **kwargs):
template, kwargs, render_kwargs = _prepare_kwargs(kwargs, "save")
output = kwargs.pop("output")
return MolGrid.from_sdf(sdf, **kwargs).save(
output, template=template, **render_kwargs
)
@save.register(Series)
@save.register(list)
@save.register(tuple)
def _(mols, **kwargs):
template, kwargs, render_kwargs = _prepare_kwargs(kwargs, "save")
output = kwargs.pop("output")
return MolGrid.from_mols(mols, **kwargs).save(
output, template=template, **render_kwargs
)