From a28b25aaaa2672b9f23609612ae832f6f09e381b Mon Sep 17 00:00:00 2001 From: Jimmy Shen <14003693+jmmshn@users.noreply.github.com> Date: Thu, 14 Dec 2023 15:53:34 -0800 Subject: [PATCH] More linting (#163) * notbooks: * linting * update configs * linting * linting * linting * linting * cover * lint * lint * lint * lint * lint * lint * lint * lint * lint * lint * lint --- pymatgen/analysis/defects/ccd.py | 1 - pymatgen/analysis/defects/core.py | 30 +++++++---- pymatgen/analysis/defects/finder.py | 43 ++++++++++++---- pymatgen/analysis/defects/generators.py | 18 ++++++- pymatgen/analysis/defects/plotting/optics.py | 53 ++++++++++++++++++-- pymatgen/analysis/defects/plotting/phases.py | 1 - pymatgen/analysis/defects/recombination.py | 19 ++++++- pymatgen/analysis/defects/supercells.py | 28 ++++++++--- pymatgen/analysis/defects/thermo.py | 32 ++++++++++-- pymatgen/analysis/defects/utils.py | 15 ++++-- 10 files changed, 196 insertions(+), 44 deletions(-) diff --git a/pymatgen/analysis/defects/ccd.py b/pymatgen/analysis/defects/ccd.py index 119088cf..01cc622e 100644 --- a/pymatgen/analysis/defects/ccd.py +++ b/pymatgen/analysis/defects/ccd.py @@ -380,7 +380,6 @@ def _get_ediff(self, output_order="skb") -> npt.NDArray: rearrangement here so that we have a single point of failure. Args: - band_structure: The band structure of the relaxed defect calculation. output_order: The order of the output. Defaults to "skb" (spin, kpoint, band]). You can also use "bks" (band, kpoint, spin). diff --git a/pymatgen/analysis/defects/core.py b/pymatgen/analysis/defects/core.py index ff82d4c0..ca075c97 100644 --- a/pymatgen/analysis/defects/core.py +++ b/pymatgen/analysis/defects/core.py @@ -18,6 +18,7 @@ from .utils import get_plane_spacing if TYPE_CHECKING: + from numpy.typing import ArrayLike from pymatgen.core import Structure from pymatgen.symmetry.structure import SymmetrizedStructure @@ -312,11 +313,7 @@ def _has_oxi(struct): @property def symmetrized_structure(self) -> SymmetrizedStructure: - """Returns the multiplicity of a defect site within the structure. - - This is required for concentration analysis and confirms that defect_site is a - site in bulk_structure. - """ + """Get the symmetrized version of the bulk structure.""" sga = SpacegroupAnalyzer( self.structure, symprec=self.symprec, angle_tolerance=self.angle_tolerance ) @@ -895,7 +892,19 @@ def get_vacancy(structure: Structure, isite: int, **kwargs) -> Vacancy: return Vacancy(structure=structure, site=site, **kwargs) -def _set_selective_dynamics(structure, site_pos, relax_radius): +def _set_selective_dynamics( + structure: Structure, site_pos: ArrayLike, relax_radius: float | str | None +): + """Set the selective dynamics behavior. + + Allow atoms to move for sites within a given radius of a given site, + all other atoms are fixed. Modify the structure in place. + + Args: + structure: The structure to set the selective dynamics. + site_pos: The center of the relaxation sphere. + relax_radius: The radius of the relaxation sphere. + """ if relax_radius is None: return if relax_radius == "auto": @@ -974,11 +983,15 @@ def _get_mapped_sites(uc_structure: Structure, sc_structure: Structure, r=0.001) return mapped_site_indices -def center_structure(structure, ref_fpos) -> Structure: +def center_structure(structure: Structure, ref_fpos: ArrayLike) -> Structure: """Shift the sites around a center. Move all the sites in the structure so that they are in the periodic image closest to the reference fractional position. + + Args: + structure: The structure to be centered. + ref_fpos: The reference fractional position that will be set to the center. """ struct = structure.copy() for idx, d_site in enumerate(struct): @@ -997,8 +1010,7 @@ def _get_el_changes_from_structures(defect_sc: Structure, bulk_sc: Structure) -> bulk_sc: The bulk structure. Returns: - str: The name of the defect, if the defect is a complex, the names of the - individual defects are separated by "+". + dict: A dictionary representing the species changes in creating the defect. """ def _check_int(n): diff --git a/pymatgen/analysis/defects/finder.py b/pymatgen/analysis/defects/finder.py index 1ee8a0d7..68c06e73 100644 --- a/pymatgen/analysis/defects/finder.py +++ b/pymatgen/analysis/defects/finder.py @@ -217,7 +217,7 @@ def get_site_groups(struct, symprec=0.01, angle_tolerance=5.0) -> List[SiteGroup return site_groups -def get_soap_vec(struct: "Structure") -> "NDArray": +def get_soap_vec(struct: "Structure") -> NDArray: """Get the SOAP vector for each site in the structure. Args: @@ -237,17 +237,32 @@ def get_soap_vec(struct: "Structure") -> "NDArray": return vecs -def get_site_vecs(struct: "Structure"): - """Get the SiteVec representation of each site in the structure.""" +def get_site_vecs(struct: Structure) -> List[SiteVec]: + """Get the SiteVec representation of each site in the structure. + + Args: + struct: Structure object to compute the site vectors (SOAP). + + Returns: + List[SiteVec]: List of SiteVec representing each site in the structure. + """ vecs = get_soap_vec(struct) - site_vecs = [] - for i, site in enumerate(struct): - site_vecs.append(SiteVec(species=site.species_string, site=site, vec=vecs[i])) - return site_vecs + return [ + SiteVec(species=site.species_string, site=site, vec=vecs[i]) + for i, site in enumerate(struct) + ] def cosine_similarity(vec1, vec2) -> float: - """Cosine similarity between two vectors.""" + """Cosine similarity between two vectors. + + Args: + vec1: First vector + vec2: Second vector + + Returns: + float: Cosine similarity between the two vectors + """ return np.dot(vec1, vec2) / (np.linalg.norm(vec1) * np.linalg.norm(vec2)) @@ -278,11 +293,19 @@ def best_match(sv: SiteVec, sgs: List[SiteGroup]) -> Tuple[SiteGroup, float]: return best_match, best_similarity -def _get_broundary(arr, n_max=16, n_skip=3): +def _get_broundary(arr, n_max=16, n_skip=3) -> int: """Get the boundary index for the high-distortion indices. Assuming arr is sorted in reverse order, find the biggest value drop in arr[n_skip:n_max]. + + Args: + arr: List of numbers + n_max: Maximum index to consider + n_skip: Number of indices to skip + + Returns: + int: The boundary index """ sub_arr = np.array(arr[n_skip:n_max]) diffs = sub_arr[1:] - sub_arr[:-1] @@ -291,7 +314,7 @@ def _get_broundary(arr, n_max=16, n_skip=3): def get_weighted_average_position( lattice: Lattice, frac_positions: ArrayLike, weights: ArrayLike | None = None -) -> "NDArray": +) -> NDArray: """Get the weighted average position of a set of positions in frac coordinates. The algorithm starts at position with the highest weight, and gradually moves diff --git a/pymatgen/analysis/defects/generators.py b/pymatgen/analysis/defects/generators.py index eb3a4ba2..faa702df 100644 --- a/pymatgen/analysis/defects/generators.py +++ b/pymatgen/analysis/defects/generators.py @@ -49,8 +49,20 @@ def _space_group_analyzer(self, structure: Structure) -> SpacegroupAnalyzer: "This generator is using the `SpaceGroupAnalyzer` and requires `symprec` and `angle_tolerance` to be set." ) + def generate(self, *args, **kwargs) -> Generator[Defect, None, None]: + """Generate a defect. + + Args: + *args: Additional positional arguments. + **kwargs: Additional keyword arguments. + + Returns: + Generator[Defect, None, None]: Generator that yields a list of ``Defect`` objects. + """ + raise NotImplementedError + def get_defects(self, *args, **kwargs) -> list[Defect]: - """Call the generator and convert the results into a list.""" + """Alias for self.generate.""" return list(self.generate(*args, **kwargs)) @@ -254,7 +266,7 @@ def generate( insertions: The insertions to be made given as a dictionary {"Mg": [[0.0, 0.0, 0.0], [0.5, 0.5, 0.5]]}. multiplicities: The multiplicities of the insertions to be made given as a dictionary {"Mg": [1, 2]}. equivalent_positions: The equivalent positions of the each inserted species given as a dictionary. - Note that they should typically be the same but we allow for more flexibility. + Note that they should typically be the same but we allow for more flexibility here. **kwargs: Additional keyword arguments for the ``Interstitial`` constructor. Returns: @@ -418,6 +430,8 @@ class ChargeInterstitialGenerator(InterstitialGenerator): min_dist: Minimum to atoms in the host structure avg_radius: The radius around each local minima used to evaluate the average charge. max_avg_charge: The maximum average charge to accept. + max_insertions: The maximum number of insertion sites to consider. + Will choose the sites with the lowest average charge. """ def __init__( diff --git a/pymatgen/analysis/defects/plotting/optics.py b/pymatgen/analysis/defects/plotting/optics.py index 01d27447..95fcc61f 100644 --- a/pymatgen/analysis/defects/plotting/optics.py +++ b/pymatgen/analysis/defects/plotting/optics.py @@ -183,7 +183,25 @@ def _plot_eigs( x_width: float = 0.3, **kwargs, ) -> None: - """Plot the eigenvalues.""" + """Plot the eigenvalues. + + Args: + d_eigs: + The dictionary of eigenvalues for the defect state. In the format of + (iband, ikpt, ispin) -> eigenvalue + e_fermi: + The bands above and below the Fermi level will be colored differently. + If not provided, they will all be colored the same. + ax: + The matplotlib axis object to plot on. + x0: + The x coordinate of the center of the set of lines representing the eigenvalues. + x_width: + The width of the set of lines representing the eigenvalues. + **kwargs: + Keyword arguments to pass to `matplotlib.pyplot.hlines`. + For example, `linestyles`, `alpha`, etc. + """ if ax is None: # pragma: no cover ax = plt.gca() @@ -215,7 +233,7 @@ def _plot_matrix_elements( arrow_width=0.1, cmap=None, norm=None, -): +) -> tuple[list[tuple], plt.cm, plt.Normalize]: """Plot arrow for the transition from the defect state to all other states. Args: @@ -242,13 +260,21 @@ def _plot_matrix_elements( The cartesian direction of the WAVDER tensor to sum over for the plot. If not provided, all the absolute values of the matrix for all three diagonal entries will be summed. + + Returns: + plot_data: + A list of tuples in the format of (iband, ikpt, ispin, eigenvalue, matrix element) + cmap: + The matplotlib color map used. + norm: + The matplotlib normalization used. """ if ax is None: # pragma: no cover ax = plt.gca() ax.set_aspect("equal") jb, jkpt, jspin = next(filter(lambda x: x[0] == defect_band_index, d_eig.keys())) y0 = d_eig[jb, jkpt, jspin] - plot_data = [] + plot_data: list[tuple] = [] for (ib, ik, ispin), eig in d_eig.items(): A = 0 for idir, jdir in ijdirs: @@ -289,8 +315,25 @@ def _plot_matrix_elements( return plot_data, cmap, norm -def _get_dataframe(d_eigs, me_plot_data) -> pd.DataFrame: - """Convert the eigenvalue and matrix element data into a pandas dataframe.""" +def _get_dataframe(d_eigs: dict, me_plot_data: list[tuple]) -> pd.DataFrame: + """Convert the eigenvalue and matrix element data into a pandas dataframe. + + Args: + d_eigs: + The dictionary of eigenvalues for the defect state. In the format of + (iband, ikpt, ispin) -> eigenvalue + me_plot_data: + A list of tuples in the format of (iband, ikpt, ispin, eigenvalue, matrix element) + + Returns: + A pandas dataframe with the following columns: + ib: The band index of the state the arrow is pointing to. + jb: The band index of the defect state. + kpt: The kpoint index of the state the arrow is pointing to. + spin: The spin index of the state the arrow is pointing to. + eig: The eigenvalue of the state the arrow is pointing to. + M.E.: The matrix element of the transition. + """ _, ikpt, ispin = next(iter(d_eigs.keys())) df = pd.DataFrame( me_plot_data, diff --git a/pymatgen/analysis/defects/plotting/phases.py b/pymatgen/analysis/defects/plotting/phases.py index 9a6a3a55..a97c0664 100644 --- a/pymatgen/analysis/defects/plotting/phases.py +++ b/pymatgen/analysis/defects/plotting/phases.py @@ -102,7 +102,6 @@ def _convex_hull_2d( points: list[dict], x_element: Element, y_element: Element, - tol: float = 0.001, competing_phases: list = None, ) -> list[dict]: """Compute the convex hull of a set of points in 2D. diff --git a/pymatgen/analysis/defects/recombination.py b/pymatgen/analysis/defects/recombination.py index 7d17085c..b4789645 100644 --- a/pymatgen/analysis/defects/recombination.py +++ b/pymatgen/analysis/defects/recombination.py @@ -30,7 +30,14 @@ @njit(cache=True) def fact(n: int) -> float: # pragma: no cover - """Compute the factorial of n.""" + """Compute the factorial of n. + + Args: + n: The number to compute the factorial of. + + Returns: + The factorial of n. + """ if n > 20: return LOOKUP_TABLE[-1] * np.prod( np.array(list(range(21, n + 1)), dtype=np.double) @@ -40,7 +47,15 @@ def fact(n: int) -> float: # pragma: no cover @njit(cache=True) def herm(x: float, n: int) -> float: # pragma: no cover - """Recursive definition of hermite polynomial.""" + """Recursive definition of hermite polynomial. + + Args: + x: The value to evaluate the hermite polynomial at. + n: The order of the hermite polynomial. + + Returns: + The value of the hermite polynomial at x. + """ if n == 0: return 1.0 if n == 1: diff --git a/pymatgen/analysis/defects/supercells.py b/pymatgen/analysis/defects/supercells.py index b63264ed..671ac855 100644 --- a/pymatgen/analysis/defects/supercells.py +++ b/pymatgen/analysis/defects/supercells.py @@ -12,7 +12,7 @@ # from pymatgen.io.ase import AseAtomsAdaptor if TYPE_CHECKING: - import numpy as np + from numpy.typing import ArrayLike, NDArray from pymatgen.core import Structure __author__ = "Jimmy-Xuan Shen" @@ -29,7 +29,7 @@ def get_sc_fromstruct( max_atoms: int = 240, min_length: float = 10.0, force_diagonal: bool = False, -) -> np.ndarray | np.array | None: +) -> NDArray | ArrayLike | None: """Generate the best supercell from a unitcell. The CubicSupercellTransformation from PMG is much faster but don't iterate over as @@ -92,7 +92,7 @@ def _cubic_cell( max_atoms: int = 240, min_length: float = 10.0, force_diagonal: bool = False, -) -> np.ndarray | None: +) -> NDArray | None: """Generate the best supercell from a unit cell. This is done using the pymatgen CubicSupercellTransformation class. @@ -125,23 +125,35 @@ def _cubic_cell( return cst.transformation_matrix -def _ase_cubic(base_struture, min_atoms: int = 80, max_atoms: int = 240): +def _ase_cubic(base_structure, min_atoms: int = 80, max_atoms: int = 240): + """Generate the best supercell from a unit cell. + + Use ASE's find_optimal_cell_shape function to find the best supercell. + + Args: + base_structure: structure of the unit cell + max_atoms: Maximum number of atoms allowed in the supercell. + min_atoms: Minimum number of atoms allowed in the supercell. + + Returns: + 3x3 matrix: supercell matrix + """ from ase.build import find_optimal_cell_shape, get_deviation_from_optimal_cell_shape from pymatgen.io.ase import AseAtomsAdaptor _logger.warn("ASE cubic supercell generation.") aaa = AseAtomsAdaptor() - ase_atoms = aaa.get_atoms(base_struture) - lower = math.ceil(min_atoms / base_struture.num_sites) - upper = math.floor(max_atoms / base_struture.num_sites) + ase_atoms = aaa.get_atoms(base_structure) + lower = math.ceil(min_atoms / base_structure.num_sites) + upper = math.floor(max_atoms / base_structure.num_sites) min_dev = (float("inf"), None) for size in range(lower, upper + 1): _logger.warn(f"Trying size {size} out of {upper}.") sc = find_optimal_cell_shape( ase_atoms.cell, target_size=size, target_shape="sc" ) - sc_cell = aaa.get_atoms(base_struture * sc).cell + sc_cell = aaa.get_atoms(base_structure * sc).cell deviation = get_deviation_from_optimal_cell_shape(sc_cell, target_shape="sc") min_dev = min(min_dev, (deviation, sc)) if min_dev[1] is None: diff --git a/pymatgen/analysis/defects/thermo.py b/pymatgen/analysis/defects/thermo.py index 94b40801..cf8cd898 100644 --- a/pymatgen/analysis/defects/thermo.py +++ b/pymatgen/analysis/defects/thermo.py @@ -69,7 +69,9 @@ class DefectEntry(MSONable): about how the corrections were calculated. These should are only used for debugging and plotting purposes. PLEASE DO NOT USE THIS AS A CONTAINER FOR IMPORTANT DATA. - + entry_id: + The entry_id for the defect entry. Usually the same as the entry_id of the + defect supercell entry. """ defect: Defect @@ -331,7 +333,8 @@ def with_atomic_entries( bulk_entry: The bulk computed entry to get the total energy of the bulk supercell. band_gap: - The band gap of the bulk crystal. + The band gap of the bulk crystal. Passed directly to the \ + FormationEnergyDiagram constructor. inc_inf_values: If False these boundary points at infinity are ignored when we look at the chemical potential limits. @@ -697,6 +700,14 @@ def with_atomic_entries( Initializes by grouping defect types, and creating a list of single FormationEnergyDiagram using the with_atomic_entries method (see above) + + Args: + bulk_entry: bulk entry + defect_entries: list of defect entries + atomic_entries: list of atomic entries + phase_diagram: phase diagram + vbm: valence band maximum for the bulk phase + **kwargs: additional kwargs for FormationEnergyDiagram """ single_form_en_diagrams = [] for _, defect_group in group_defect_entries(defect_entries=defect_entries): @@ -1030,7 +1041,11 @@ def fermi_dirac(energy: float, temperature: int | float) -> float: Gets the defects equilibrium concentration (up to the multiplicity factor) at a particular fermi level, chemical potential, and temperature (in Kelvin), - assuming dilue limit thermodynamics (non-interacting defects) using FD statistics. + assuming dilute limit thermodynamics (non-interacting defects) using FD statistics. + + Args: + energy: Energy of the defect with respect to the VBM. + temperature: Temperature in Kelvin. """ return 1.0 / (1.0 + np.exp((energy) / (boltzman_eV_K * temperature))) @@ -1244,6 +1259,17 @@ def plot_formation_energy_diagrams( def _get_line_color_and_style(colors=None, styles=None): + """Get a generator for colors and styles. + + Create an iterator that will cycle through the colors and styles. + + Args: + colors: List of colors to use, if None, use the default matplotlib colors. + styles: List of styles to use, if None, will use ["-", "--", "-.", ":"] + + Returns: + Generator of (color, style) tuples + """ if colors is None: colors = plt.rcParams["axes.prop_cycle"].by_key()["color"] if styles is None: diff --git a/pymatgen/analysis/defects/utils.py b/pymatgen/analysis/defects/utils.py index 79c9766b..43e34cd3 100644 --- a/pymatgen/analysis/defects/utils.py +++ b/pymatgen/analysis/defects/utils.py @@ -196,8 +196,18 @@ def generate_reciprocal_vectors_squared(a1, a2, a3, encut): yield np.dot(vec, vec) -def converge(f, step, tol, max_h): - """Simple newton iteration based convergence function.""" +def converge(f, step, tol, max_h) -> float: + """Simple newton iteration based convergence function. + + Args: + f: function to converge + step: step size for newton iteration + tol: tolerance for convergence + max_h: maximum value of h to try before giving up + + Returns: + converged value of f + """ g = f(0) dx = 10000 h = step @@ -843,7 +853,6 @@ def get_ipr_in_window( bandstructure: The bandstructure object. The band just below the fermi level is used as the center of band window. procar: The procar object. - k_index: The index of the k-point to use. If None, the IPR is averaged over all k-points. band_window: The number of bands above and blow the fermi level to include in the search window. Returns: