Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

WaterBridge interaction #229

Open
wants to merge 15 commits into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion .github/workflows/ci.yml
Original file line number Diff line number Diff line change
Expand Up @@ -64,7 +64,7 @@ jobs:
python-version: ${{ matrix.python-version }}
auto-update-conda: true
use-mamba: true
miniforge-variant: Mambaforge
miniforge-variant: Miniforge3

- name: Check conda and pip
run: |
Expand Down
9 changes: 3 additions & 6 deletions docs/notebooks/docking.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -609,7 +609,7 @@
"ref_mol = plf.Molecule.from_mda(ref)\n",
"\n",
"# generate IFP for the reference\n",
"fp_ref = plf.Fingerprint(fp.interactions)\n",
"fp_ref = plf.Fingerprint(list(fp.interactions))\n",
"fp_ref.run_from_iterable([ref_mol], protein_mol)\n",
"df_ref = fp_ref.to_dataframe(index_col=\"Pose\")\n",
"\n",
Expand Down Expand Up @@ -853,11 +853,8 @@
}
],
"metadata": {
"interpreter": {
"hash": "8787e9fc73b27535744a25d17e74686c0add9df598b8e27ca04412fce7f0c7ae"
},
"kernelspec": {
"display_name": "Python 3.8.5 ('prolif')",
"display_name": "prolif",
"language": "python",
"name": "python3"
},
Expand All @@ -871,7 +868,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.13"
"version": "3.11.9"
}
},
"nbformat": 4,
Expand Down
104,651 changes: 104,651 additions & 0 deletions prolif/data/water_m2.pdb

Large diffs are not rendered by default.

Binary file added prolif/data/water_m2.xtc
Binary file not shown.
119 changes: 103 additions & 16 deletions prolif/fingerprint.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,16 +29,22 @@
import warnings
from collections.abc import Sized
from functools import wraps
from inspect import signature
from typing import Literal, Optional, Tuple, Union

import dill
import multiprocess as mp
import numpy as np
from MDAnalysis.converters.RDKit import atomgroup_to_mol, set_converter_cache_size
from rdkit import Chem
from tqdm.auto import tqdm

from prolif.ifp import IFP
from prolif.interactions.base import _BASE_INTERACTIONS, _INTERACTIONS
from prolif.interactions.base import (
_BASE_INTERACTIONS,
_BRIDGED_INTERACTIONS,
_INTERACTIONS,
)
from prolif.molecule import Molecule
from prolif.parallel import MolIterablePool, TrajectoryPool
from prolif.plotting.utils import IS_NOTEBOOK
Expand Down Expand Up @@ -206,19 +212,21 @@
"PiCation",
"VdWContact",
]
self.interactions = interactions
self.count = count
self._set_interactions(interactions, parameters)
self.vicinity_cutoff = vicinity_cutoff
self.parameters = parameters

def _set_interactions(self, interactions, parameters):
# read interactions to compute
parameters = parameters or {}
if interactions == "all":
interactions = self.list_available()

# sanity check
self._check_valid_interactions(interactions, "interactions")
self._check_valid_interactions(parameters, "parameters")

# add interaction methods
self.interactions = {}
wrapper = all_occurences if self.count else first_occurence
Expand All @@ -229,37 +237,67 @@
if name in interactions:
self.interactions[name] = wrapper(interaction)

# add bridged interactions
self.bridged_interactions = {}
for name, interaction_cls in _BRIDGED_INTERACTIONS.items():
if name in interactions:
params = parameters.get(name, {})
if not params:
raise ValueError(
f"Must specify settings for bridged interaction {name!r}: try "
f'`parameters={{"{name}": {{...}}}}`'
)
sig = signature(interaction_cls.__init__)
if "count" in sig.parameters:
params.setdefault("count", self.count)
interaction = interaction_cls(**params)
setattr(self, name.lower(), interaction)
self.bridged_interactions[name] = interaction

def _check_valid_interactions(self, interactions_iterable, varname):
"""Raises a NameError if an unknown interaction is given."""
unsafe = set(interactions_iterable)
unknown = unsafe.symmetric_difference(_INTERACTIONS.keys()) & unsafe
known = {*_INTERACTIONS, *_BRIDGED_INTERACTIONS}
unknown = unsafe.difference(known)
if unknown:
raise NameError(
f"Unknown interaction(s) in {varname!r}: {', '.join(unknown)}",
)

def __repr__(self): # pragma: no cover
name = ".".join([self.__class__.__module__, self.__class__.__name__])
params = f"{self.n_interactions} interactions: {list(self.interactions.keys())}"
params = f"{self.n_interactions} interactions: {self._interactions_list}"
return f"<{name}: {params} at {id(self):#x}>"

@staticmethod
def list_available(show_hidden=False):
def list_available(show_hidden=False, show_bridged=False):
"""List interactions available to the Fingerprint class.

Parameters
----------
show_hidden : bool
Show hidden classes (base classes meant to be inherited from to create
custom interactions).
show_bridged : bool
Show bridged interaction classes such as ``WaterBridge``.
"""
interactions = sorted(_INTERACTIONS)
if show_bridged:
interactions.extend(sorted(_BRIDGED_INTERACTIONS))

Check warning on line 286 in prolif/fingerprint.py

View check run for this annotation

Codecov / codecov/patch

prolif/fingerprint.py#L286

Added line #L286 was not covered by tests
if show_hidden:
return sorted(_BASE_INTERACTIONS) + sorted(_INTERACTIONS)
return sorted(_INTERACTIONS)
return sorted(_BASE_INTERACTIONS) + interactions
return interactions

@property
def _interactions_list(self):
interactions = list(self.interactions)
if self.bridged_interactions:
interactions.extend(self.bridged_interactions)

Check warning on line 295 in prolif/fingerprint.py

View check run for this annotation

Codecov / codecov/patch

prolif/fingerprint.py#L295

Added line #L295 was not covered by tests
return interactions

@property
def n_interactions(self):
return len(self.interactions)
return len(self._interactions_list)

def bitvector(self, res1, res2):
"""Generates the complete bitvector for the interactions between two
Expand Down Expand Up @@ -473,22 +511,54 @@
if converter_kwargs is not None and len(converter_kwargs) != 2:
raise ValueError("converter_kwargs must be a list of 2 dicts")

# setup defaults
converter_kwargs = converter_kwargs or ({}, {})
if (
self.bridged_interactions
and (maxsize := atomgroup_to_mol.cache_parameters()["maxsize"])
and maxsize <= 2
):
set_converter_cache_size(2 + len(self.bridged_interactions))
if n_jobs is None:
n_jobs = int(os.environ.get("PROLIF_N_JOBS", "0")) or None
if residues == "all":
residues = list(Molecule.from_mda(prot, **converter_kwargs[1]).residues)
if n_jobs != 1:
return self._run_parallel(

if self.interactions:
if n_jobs == 1:
ifp = self._run_serial(
traj,
lig,
prot,
residues=residues,
converter_kwargs=converter_kwargs,
progress=progress,
)
else:
ifp = self._run_parallel(
traj,
lig,
prot,
residues=residues,
converter_kwargs=converter_kwargs,
progress=progress,
n_jobs=n_jobs,
)
self.ifp = ifp

if self.bridged_interactions:
self._run_bridged_analysis(
traj,
lig,
prot,
residues=residues,
converter_kwargs=converter_kwargs,
progress=progress,
n_jobs=n_jobs,
)
return self

def _run_serial(self, traj, lig, prot, *, residues, converter_kwargs, progress):
"""Serial implementation for trajectories."""
iterator = tqdm(traj) if progress else traj
ifp = {}
for ts in iterator:
Expand All @@ -500,8 +570,7 @@
residues=residues,
metadata=True,
)
self.ifp = ifp
return self
return ifp

def _run_parallel(
self,
Expand Down Expand Up @@ -537,8 +606,7 @@
for ifp_data_chunk in pool.process(args_iterable):
ifp.update(ifp_data_chunk)

self.ifp = ifp
return self
return ifp

def run_from_iterable(
self,
Expand Down Expand Up @@ -660,6 +728,25 @@
self.ifp = ifp
return self

def _run_bridged_analysis(self, traj, lig, prot, **kwargs):
"""Implementation of the WaterBridge analysis for trajectories.

Parameters
----------
traj : MDAnalysis.coordinates.base.ProtoReader or MDAnalysis.coordinates.base.FrameIteratorSliced
Iterate over this Universe trajectory or sliced trajectory object
to extract the frames used for the fingerprint extraction
lig : MDAnalysis.core.groups.AtomGroup
An MDAnalysis AtomGroup for the ligand
prot : MDAnalysis.core.groups.AtomGroup
An MDAnalysis AtomGroup for the protein (with multiple residues)
""" # noqa: E501
self.ifp = getattr(self, "ifp", {})
for interaction in self.bridged_interactions.values():
interaction.setup(ifp_store=self.ifp, **kwargs)
interaction.run(traj, lig, prot)
return self

def to_dataframe(
self,
*,
Expand Down Expand Up @@ -715,7 +802,7 @@
if hasattr(self, "ifp"):
return to_dataframe(
self.ifp,
self.interactions,
self._interactions_list,
count=self.count if count is None else count,
dtype=dtype,
drop_empty=drop_empty,
Expand Down
1 change: 1 addition & 0 deletions prolif/interactions/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,3 +23,4 @@
XBAcceptor,
XBDonor,
)
from prolif.interactions.water_bridge import WaterBridge
39 changes: 37 additions & 2 deletions prolif/interactions/base.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,18 +6,21 @@
"""

import warnings
from abc import abstractmethod
from itertools import product
from math import degrees, radians

import numpy as np
from rdkit import Geometry
from rdkit.Chem import MolFromSmarts

from prolif.ifp import IFP
from prolif.interactions.utils import DISTANCE_FUNCTIONS, get_mapindex
from prolif.utils import angle_between_limits, get_centroid, get_ring_normal_vector

_INTERACTIONS = {}
_BASE_INTERACTIONS = {}
_INTERACTIONS: dict[str, type["Interaction"]] = {}
_BRIDGED_INTERACTIONS: dict[str, type["BridgedInteraction"]] = {}
_BASE_INTERACTIONS: dict[str, type["Interaction"]] = {}


class Interaction:
Expand Down Expand Up @@ -111,6 +114,38 @@
return inverted


class BridgedInteraction:
"""Base class for bridged interactions."""

def __init_subclass__(cls):
super().__init_subclass__()
name = cls.__name__
register = _BRIDGED_INTERACTIONS
if name in register:
warnings.warn(

Check warning on line 125 in prolif/interactions/base.py

View check run for this annotation

Codecov / codecov/patch

prolif/interactions/base.py#L125

Added line #L125 was not covered by tests
f"The {name!r} interaction has been superseded by a "
f"new class with id {id(cls):#x}",
stacklevel=2,
)
register[name] = cls

def __init__(self):
self.ifp = {}
# force empty setup to initialize args with defaults
self.setup()
Dismissed Show dismissed Hide dismissed

def setup(self, ifp_store=None, **kwargs) -> None:
"""Setup additional arguments passed at runtime to the fingerprint generator's
``run`` method.
"""
self.ifp = ifp_store if ifp_store is not None else {}
self.kwargs = kwargs

@abstractmethod
def run(self, traj, lig, prot) -> dict[int, IFP]:
raise NotImplementedError()


class Distance(Interaction, is_abstract=True):
"""Generic class for distance-based interactions

Expand Down
Loading
Loading