Source code for aim2dat.strct.ext_analysis.fragmentation

"""Module to find bonded molecular fragments in an extended structure."""

# Standard library imports
from typing import List

# Third party library imports
import numpy as np

# Internal library imports
from aim2dat.strct.strct import Structure
from aim2dat.strct.ext_analysis.decorator import external_analysis_method


[docs] @external_analysis_method def determine_molecular_fragments( structure: Structure, max_fragment_size: int = 100, exclude_elements: List[str] = None, exclude_sites: List[int] = None, end_point_elements: List[str] = None, **cn_kwargs, ) -> List[Structure]: """ Find molecular fragments in a larger molecule/cluster of periodic crystal. Parameters ---------- structure : aim2dat.strct.Structure Structure object. max_fragment_size : int Maximum size of the fragments to avoid recursion overflow. exclude_elements : list List of elements that are excluded from the search. exclude_sites : list List of site indices that are excluded from the search. end_point_elements : list List of elements that serve as an end point for a fragment. r_max : float (optional) Cut-off value for the maximum distance between two atoms in angstrom. cn_kwargs : Optional keyword arguments passed on to the ``calculate_coordination`` function. Returns ------- list List of fragments. """ if exclude_elements is None: exclude_elements = [] if exclude_sites is None: exclude_sites = [] if end_point_elements is None: end_point_elements = [] used_site_indices = [] molecular_fragments = [] coord = structure.calculate_coordination(**cn_kwargs) allowed_sites = [] for site_idx, el in enumerate(structure.elements): if site_idx not in exclude_sites and el not in exclude_elements: allowed_sites.append(site_idx) for site_idx in allowed_sites: if ( coord["sites"][site_idx]["element"] in end_point_elements or site_idx in used_site_indices ): continue mol_fragment = { "elements": [], "site_attributes": {"parent_indices": []}, "positions": [], "pbc": False, } _recursive_graph_builder( site_idx, mol_fragment, max_fragment_size, allowed_sites, end_point_elements, coord["sites"], np.array(structure.positions[site_idx]), ) if mol_fragment["elements"] != []: molecular_fragments.append(Structure(**mol_fragment)) used_site_indices += mol_fragment["site_attributes"]["parent_indices"] return None, molecular_fragments
def _recursive_graph_builder( site_idx, mol_fragment, max_fragment_size, allowed_sites, end_point_elements, sites, position, ): """ Find nearest neighbour of the first atom and adds it to the fragment. Take the neighbour of the neighbour and adds it to the fragment until all neighbours are found. """ # Conditions to be added to the fragment: if len(mol_fragment["elements"]) >= max_fragment_size: return None if site_idx in allowed_sites: # Steps: # 1) Check if site with same position is already in mol_fragment dictionary. for site_idx2, position2 in zip( mol_fragment["site_attributes"]["parent_indices"], mol_fragment["positions"] ): if site_idx == site_idx2 and np.linalg.norm(position - position2) < 1e-3: return None # 2) Update mol_fragment dictionary. element = sites[site_idx]["element"] mol_fragment["elements"].append(element) mol_fragment["site_attributes"]["parent_indices"].append(site_idx) mol_fragment["positions"].append(position.tolist()) shift = position - np.array(sites[site_idx]["position"]) if element not in end_point_elements: # 3) Iterate through neighbours and start graph builder with new index. for neighbour in sites[site_idx]["neighbours"]: _recursive_graph_builder( neighbour["site_index"], mol_fragment, max_fragment_size, allowed_sites, end_point_elements, sites, np.array(neighbour["position"]) + shift, )