Other

A collection of common functions for basic MD process: supercell, read and write POSCAR, PDF, XYZ, progressbar, replace_in_file, read_ORCA

`evaluate_linear_fit_np(x, y)`

Evaluate a simple linear fit.

Parameters:

Name	Type	Description	Default
`x`	`ndarray`	Independent variable values.	required
`y`	`ndarray`	Dependent variable values.	required

Returns:

Type	Description
`tuple[float, float]`	Coefficient of determination (R^2) and mean squared error.

Source code in m2dtools/other/common.py

def evaluate_linear_fit_np(x, y):
    """Evaluate a simple linear fit.

    Parameters
    ----------
    x : numpy.ndarray
        Independent variable values.
    y : numpy.ndarray
        Dependent variable values.

    Returns
    -------
    tuple[float, float]
        Coefficient of determination (R^2) and mean squared error.
    """
    # Fit a linear model
    coefficients = np.polyfit(x, y, 1)
    polynomial = np.poly1d(coefficients)

    # Predict y values
    y_pred = polynomial(x)

    # Calculate R2 score
    ss_res = np.sum((y - y_pred) ** 2)  # MSE
    ss_tot = np.sum((y - np.mean(y)) ** 2)
    r2 = 1 - (ss_res / ss_tot)

    return r2, np.sqrt(ss_res)

`pdf_sq_1type(box, natom, type_atom, coors, r_cutoff=10, delta_r=0.01)`

Compute pair distribution and structure factors for a single species.

Parameters:

Name	Type	Description	Default
`box`	`ndarray`	Simulation box matrix.	required
`natom`	`int`	Total number of atoms.	required
`type_atom`	`array - like`	Atom type identifiers.	required
`coors`	`ndarray`	Cartesian coordinates.	required
`r_cutoff`	`float`	Maximum distance for the radial distribution function.	`10`
`delta_r`	`float`	Bin width for the radial distribution function.	`0.01`

Returns:

Type	Description
`tuple[ndarray, ndarray, ndarray, ndarray]`	Radial positions, pair distribution function, q values and structure factor for the single-species system.

Source code in m2dtools/other/common.py

def pdf_sq_1type(box, natom, type_atom, coors, r_cutoff=10, delta_r=0.01):
    """Compute pair distribution and structure factors for a single species.

    Parameters
    ----------
    box : numpy.ndarray
        Simulation box matrix.
    natom : int
        Total number of atoms.
    type_atom : array-like
        Atom type identifiers.
    coors : numpy.ndarray
        Cartesian coordinates.
    r_cutoff : float, default 10
        Maximum distance for the radial distribution function.
    delta_r : float, default 0.01
        Bin width for the radial distribution function.

    Returns
    -------
    tuple[numpy.ndarray, numpy.ndarray, numpy.ndarray, numpy.ndarray]
        Radial positions, pair distribution function, q values and structure
        factor for the single-species system.
    """
    type_atom = np.array(type_atom)
    n1 = natom
    rcoors = np.dot(coors, np.linalg.inv(box))
    rdis = np.zeros([natom, natom, 3])
    for i in range(natom):
        tmp = rcoors[i]
        rdis[i, :, :] = tmp - rcoors
    rdis[rdis < -0.5] = rdis[rdis < -0.5] + 1
    rdis[rdis > 0.5] = rdis[rdis > 0.5] - 1
    a = np.dot(rdis[:, :, :], box)
    dis = np.sqrt((np.square(a[:, :, 0]) + np.square(a[:, :, 1]) + np.square(a[:, :, 2])))
    r_max = r_cutoff
    r = np.linspace(delta_r, r_max, int(r_max / delta_r))
    V = np.dot(np.cross(box[1, :], box[2, :]), box[0, :])
    rho1 = n1 / V
    c = np.array([rho1 * rho1]) * V
    g1 = np.histogram(dis[:n1, :n1], bins=r)[0] / (4 * np.pi * (r[1:] - delta_r / 2) ** 2 * delta_r * c[0])
    R = r[1:] - delta_r / 2

    dq = 0.01
    qrange = [np.pi / 2 / r_max, 25]
    Q = np.arange(np.floor(qrange[0] / dq), np.floor(qrange[1] / dq), 1) * dq
    S1 = np.zeros([len(Q)])
    rho = natom / np.dot(np.cross(box[1, :], box[2, :]), box[0, :]) / 10 ** 3
    # use a window function for fourier transform
    for i in np.arange(len(Q)):
        S1[i] = 1 + 4 * np.pi * rho / Q[i] * np.trapz(
            (g1 - 1) * np.sin(Q[i] * R) * R * np.sin(np.pi * R / r_max) / (np.pi * R / r_max), R)

    return R, g1, Q, S1

`read_pos(file_name)`

Read a VASP POSCAR structure.

Parameters:

Name	Type	Description	Default
`file_name`	`str`	Path to the POSCAR file.	required

Returns:

Type	Description
`tuple[ndarray, ndarray, ndarray, ndarray]`	Box matrix, atomic species, species counts and Cartesian coordinates.

Source code in m2dtools/other/common.py

def read_pos(file_name):
    """Read a VASP POSCAR structure.

    Parameters
    ----------
    file_name : str
        Path to the POSCAR file.

    Returns
    -------
    tuple[numpy.ndarray, numpy.ndarray, numpy.ndarray, numpy.ndarray]
        Box matrix, atomic species, species counts and Cartesian coordinates.
    """
    f = open(file_name, 'r')
    lf = list(f)
    f.close()
    box = np.zeros((3, 3))
    ratio = float(lf[1].split()[0])
    box[0, :] = np.array(lf[2].split()).astype(float)*ratio
    box[1, :] = np.array(lf[3].split()).astype(float)*ratio
    box[2, :] = np.array(lf[4].split()).astype(float)*ratio
    a_type = np.array(lf[5].split())
    num_type = np.array(lf[6].split()).astype(int)

    natom = np.sum(num_type)
    coors = np.zeros((natom, 3))

    if lf[7].split()[0][0] == 'C' or lf[7].split()[0][0] == 'c':
        print('Cartesian coordinates detected in POSCAR.')
        l = 0
        for ia in lf[8:8+natom]:
            coors[l, :] = np.array(ia.split()[0:3:1]).astype('float')
            l += 1

    if lf[7].split()[0][0] == 'D' or lf[7].split()[0][0] == 'd':
        l = 0
        rcoors = np.zeros((natom, 3))
        for ia in lf[8:8+natom]:
            rcoors[l, :] = np.array(ia.split()[0:3:1]).astype('float')
            l += 1
        coors = rcoors @ box
    else:
        print('Error: only Cartesian or Direct coordinates are supported in POSCAR!')

    return box, a_type, num_type, coors

`read_xyz_simple(filename)`

Read an extended XYZ file. Returns: types : (N,) array of strings coords : (N,3) float array lattice: (3,3) float array (box matrix)

Source code in m2dtools/other/common.py

def read_xyz_simple(filename):
    """
    Read an extended XYZ file.
    Returns:
        types  : (N,) array of strings
        coords : (N,3) float array
        lattice: (3,3) float array  (box matrix)
    """
    with open(filename, "r") as f:
        # --- first line: number of atoms ---
        natoms = int(f.readline().strip())

        # --- second line: comment, possibly containing Lattice="..." ---
        comment = f.readline().strip()

        # --- parse Lattice="..." if present ---
        lattice = np.eye(3)
        m = re.search(r'Lattice="([^"]+)"', comment)
        if m:
            nums = list(map(float, m.group(1).split()))
            if len(nums) != 9:
                raise ValueError("Lattice must contain 9 numbers.")
            lattice = np.array(nums).reshape(3, 3)

        # --- read atoms ---
        types = []
        coords = []
        for _ in range(natoms):
            line = f.readline().strip()
            if not line:
                raise ValueError("Unexpected EOF while reading atoms.")

            parts = line.split()
            if len(parts) < 4:
                continue

            types.append(parts[0])
            coords.append([float(parts[1]), float(parts[2]), float(parts[3])])

    return np.array(types), np.array(coords, float), lattice

`replace_in_file(file_path_old, file_path_new, old_string, new_string)`

Replace text within a file and write the updated copy.

Parameters:

Name	Type	Description	Default
`file_path_old`	`str`	Source file to read.	required
`file_path_new`	`str`	Destination path for the updated content.	required
`old_string`	`str`	Text to be replaced.	required
`new_string`	`str`	Replacement text.	required

Returns:

Type	Description
`None`	Writes `file_path_new` with updated contents.

Source code in m2dtools/other/common.py

def replace_in_file(file_path_old, file_path_new, old_string, new_string):
    """Replace text within a file and write the updated copy.

    Parameters
    ----------
    file_path_old : str
        Source file to read.
    file_path_new : str
        Destination path for the updated content.
    old_string : str
        Text to be replaced.
    new_string : str
        Replacement text.

    Returns
    -------
    None
        Writes ``file_path_new`` with updated contents.
    """
    try:
        # Read the content of the file
        with open(file_path_old, 'r') as file:
            content = file.read()

        # Replace old_string with new_string
        modified_content = content.replace(old_string, new_string)

        # Write the modified content back to the file
        with open(file_path_new, 'w') as file:
            file.write(modified_content)

        print("File updated successfully.")
    except IOError as e:
        print(f"An error occurred: {e}")

`supercell(natoms, box0, nx, ny, nz, index0, atom_type0, coors0)`

Build a replicated supercell from an orthogonal unit cell.

Parameters:

Name	Type	Description	Default
`natoms`	`int`	Number of atoms in the original cell.	required
`box0`	`ndarray`	`(3, 3)` box matrix for the original cell.	required
`nx`	`int`	Replication counts along each lattice vector.	required
`ny`	`int`	Replication counts along each lattice vector.	required
`nz`	`int`	Replication counts along each lattice vector.	required
`index0`	`ndarray`	Atom indices for the original cell.	required
`atom_type0`	`ndarray`	Atom types for the original cell.	required
`coors0`	`ndarray`	Cartesian coordinates for the original cell.	required

Returns:

Type	Description
`tuple`	`(natoms_new, box_new, index_new, atom_type_new, coors_new)` for the replicated supercell.

Source code in m2dtools/other/common.py

def supercell(natoms, box0, nx, ny, nz, index0, atom_type0, coors0):
    """Build a replicated supercell from an orthogonal unit cell.

    Parameters
    ----------
    natoms : int
        Number of atoms in the original cell.
    box0 : numpy.ndarray
        ``(3, 3)`` box matrix for the original cell.
    nx, ny, nz : int
        Replication counts along each lattice vector.
    index0 : numpy.ndarray
        Atom indices for the original cell.
    atom_type0 : numpy.ndarray
        Atom types for the original cell.
    coors0 : numpy.ndarray
        Cartesian coordinates for the original cell.

    Returns
    -------
    tuple
        ``(natoms_new, box_new, index_new, atom_type_new, coors_new)`` for the
        replicated supercell.
    """

    box_new = box0@np.array([[nx, 0, 0], [0, ny, 0], [0, 0, nz]])
    natoms_new = natoms*nx*ny*nz

    # coors_new = np.empty([1,3])
    # index_new = np.empty

    for ix in range(nx):
        for iy in range(ny):
            for iz in range(nz):
                if ix+iy+iz == 0:
                    coors_new = coors0
                    atom_type_new = atom_type0
                    index_new = index0
                    index_tmp = index0
                else:
                    coors_tmp = coors0 + ix*box0[0, :] + iy*box0[1, :] + iz*box0[2, :]
                    coors_new = np.vstack((coors_new, coors_tmp))

                    atom_type_new = np.concatenate((atom_type_new, atom_type0))
                    index_tmp = index_tmp + natoms
                    index_new = np.concatenate((index_new, index_tmp))

    return natoms_new, box_new, index_new, atom_type_new, coors_new

`write_pos(file_name, box, a_type, num_type, coors)`

Write a VASP POSCAR structure.

Parameters:

Name	Type	Description	Default
`file_name`	`str`	Destination POSCAR path.	required
`box`	`ndarray`	`(3, 3)` lattice matrix.	required
`a_type`	`array - like`	Sequence of element symbols.	required
`num_type`	`array - like`	Number of atoms for each element.	required
`coors`	`ndarray`	Cartesian coordinates for all atoms.	required

Returns:

Type	Description
`None`	The POSCAR file is written to `file_name`.

Source code in m2dtools/other/common.py

def write_pos(file_name, box, a_type, num_type, coors):
    """Write a VASP POSCAR structure.

    Parameters
    ----------
    file_name : str
        Destination POSCAR path.
    box : numpy.ndarray
        ``(3, 3)`` lattice matrix.
    a_type : array-like
        Sequence of element symbols.
    num_type : array-like
        Number of atoms for each element.
    coors : numpy.ndarray
        Cartesian coordinates for all atoms.

    Returns
    -------
    None
        The POSCAR file is written to ``file_name``.
    """
    f = open(file_name, 'w')
    f.write('written by python script\n')
    f.write('1.0\n')

    for i in range(3):
        f.write('{0:20.12f}{1:20.12f}{2:20.12f}\n'.format(box[i, 0], box[i, 1], box[i, 2]))

    for i in range(len(a_type)):
        f.write(' {}'.format(a_type[i]))
    f.write('\n')
    for i in range(len(a_type)):
        f.write(' {}'.format(num_type[i]))
    f.write('\n')

    natom = np.sum(num_type)
    f.write('C\n')
    for i in range(natom):
        f.write('{0:20.12f}{1:20.12f}{2:20.12f}\n'.format(coors[i, 0], coors[i, 1], coors[i, 2]))

    f.close()

`write_xyz_file(atom_types, coordinates, filename, comment='')`

Write an XYZ file from atom types and coordinates.

Parameters:

Name	Type	Description	Default
`atom_types`	`list[str]`	Atom types or symbols.	required
`coordinates`	`list[tuple[float, float, float]]`	Cartesian coordinates for each atom.	required
`filename`	`str`	Path to the output XYZ file.	required
`comment`	`str`	Comment to include on the second line of the file.	`""`

Returns:

Type	Description
`None`	The XYZ file is written to `filename`.

Source code in m2dtools/other/common.py

def write_xyz_file(atom_types, coordinates, filename, comment=""):
    """Write an XYZ file from atom types and coordinates.

    Parameters
    ----------
    atom_types : list[str]
        Atom types or symbols.
    coordinates : list[tuple[float, float, float]]
        Cartesian coordinates for each atom.
    filename : str
        Path to the output XYZ file.
    comment : str, default ""
        Comment to include on the second line of the file.

    Returns
    -------
    None
        The XYZ file is written to ``filename``.
    """
    num_atoms = len(atom_types)
    with open(filename, 'w') as file:
        file.write(f"{num_atoms}\n")
        file.write(f"{comment}\n")
        for atom_type, (x, y, z) in zip(atom_types, coordinates):
            file.write(f"{atom_type} {x:.6f} {y:.6f} {z:.6f}\n")

Tools for reading and writing .gro files

`gro2pos(posfile, grofile)`

Convert a .gro file to a POSCAR structure.

Parameters:

Name	Type	Description	Default
`posfile`	`str`	Destination POSCAR file path.	required
`grofile`	`str`	Source `.gro` trajectory file.	required

Returns:

Type	Description
`None`	Writes the POSCAR representation to `posfile`.

Source code in m2dtools/other/tools_gro.py

def gro2pos(posfile, grofile):
    """Convert a ``.gro`` file to a POSCAR structure.

    Parameters
    ----------
    posfile : str
        Destination POSCAR file path.
    grofile : str
        Source ``.gro`` trajectory file.

    Returns
    -------
    None
        Writes the POSCAR representation to ``posfile``.
    """
    box, natom, type_atom, coors0 = read_gro('{}'.format(grofile))

    elements = list(set(type_atom))
    n_elements = len(elements)

    n_atom = []
    id_atom = []
    for i_e in range(n_elements):
        id_atom.append(np.array(np.where(type_atom == elements[i_e]))[0])
        n_atom.append(id_atom[i_e].shape[0])

    f1 = open('{}'.format(posfile), 'w')
    f1.write('generated by gro2pos\n')
    f1.write(' 1.0\n')
    for ib in range(3):
        f1.write(' {0:20.12f} {1:20.12f} {2:20.12f}\n'.format(10*box[ib, 0], 10*box[ib, 1], 10*box[ib, 2]))

    for i_e in range(n_elements):
        f1.write(' {}'.format(elements[i_e]))
    f1.write('\n')

    for i_e in range(n_elements):
        f1.write(' {0:8d}'.format(n_atom[i_e]))
    f1.write('\n')
    f1.write('C\n')
    for i_e in range(n_elements):
        for ic in range(n_atom[i_e]):
            f1.write(' {0:20.12f} {1:20.12f} {2:20.12f}\n'.format(10*coors0[id_atom[i_e][ic], 0], 10*coors0[id_atom[i_e][ic], 1], 10*coors0[id_atom[i_e][ic], 2]))

    f1.close()

`read_gro(file_name)`

Read a GROMACS .gro file.

Parameters:

Name	Type	Description	Default
`file_name`	`str`	Path to the `.gro` file.	required

Returns:

Type	Description
`tuple[ndarray, int, ndarray, ndarray]`	Box matrix, atom count, atom types and coordinates.

Source code in m2dtools/other/tools_gro.py

def read_gro(file_name):
    """Read a GROMACS ``.gro`` file.

    Parameters
    ----------
    file_name : str
        Path to the ``.gro`` file.

    Returns
    -------
    tuple[numpy.ndarray, int, numpy.ndarray, numpy.ndarray]
        Box matrix, atom count, atom types and coordinates.
    """
    f = open(file_name, 'r')
    lf = list(f)
    f.close()
    len1 = float(lf[-1].split()[0])
    len2 = float(lf[-1].split()[1])
    len3 = float(lf[-1].split()[2])
    box = np.diag([len1, len2, len3])
    natom = int(lf[1])
    coors = np.zeros([natom, 3])
    type_atom = []
    l = 0
    for ia in lf[2:2+natom]:
        if l < 9999:
            coors[l, :] = np.array(ia.split()[3:6:1]).astype('float')
            type_atom.append(ia.split()[1])
        else:
            coors[l, :] = np.array(ia.split()[2:5:1]).astype('float')
            tmp = ia.split()[1]
            type_atom.append(re.findall(r'(\w+?)(\d+)', tmp)[0][0])
        l += 1

    type_atom = np.array(type_atom)
    return box, natom, type_atom, coors

`read_gro_multi(gro_file)`

Read multiple frames from a concatenated .gro file.

Parameters:

Name	Type	Description	Default
`gro_file`	`str`	Path to the multi-frame `.gro` file.	required

Returns:

Type	Description
`tuple[list, list]`	List of frame tuples `(box, natom, type_atom, coors)` and the corresponding timestep labels.

Source code in m2dtools/other/tools_gro.py

def read_gro_multi(gro_file):
    """Read multiple frames from a concatenated ``.gro`` file.

    Parameters
    ----------
    gro_file : str
        Path to the multi-frame ``.gro`` file.

    Returns
    -------
    tuple[list, list]
        List of frame tuples ``(box, natom, type_atom, coors)`` and the
        corresponding timestep labels.
    """

    f = open(gro_file)
    lft = list(f)
    f.close()
    lt = []
    t = []
    for il in range(len(lft)):
        if 't=' in lft[il]:
            lt.append(il)
            t.append(lft[il].split()[2])

    def read_lf(lf):
        len1 = float(lf[-1].split()[0])
        len2 = float(lf[-1].split()[1])
        len3 = float(lf[-1].split()[2])
        box = np.diag([len1, len2, len3])
        natom = int(lf[1])
        coors = np.zeros([natom, 3])
        type_atom = []
        l = 0
        for ia in lf[2:2+natom]:
            if l < 9999:
                coors[l, :] = np.array(ia.split()[3:6:1]).astype('float')
                type_atom.append(ia.split()[1])
            else:
                coors[l, :] = np.array(ia.split()[2:5:1]).astype('float')
                tmp = ia.split()[1]
                type_atom.append(re.findall(r'(\w+?)(\d+)', tmp)[0][0])
            l += 1

        type_atom = np.array(type_atom)
        return box, natom, type_atom, coors

    # lf=[]
    result = []
    for it in range(len(lt)):
        if it == len(lt)-1:
            #         lf.append(lft[lt[it]:])
            result.append(read_lf(lft[lt[it]:]))
        else:
            #         lf.append(lft[lt[it]:lt[it+1]-1])
            result.append(read_lf(lft[lt[it]:lt[it+1]]))

    return result, t

`write_gro(filename, box, natom, type_atom, coors)`

Write a GROMACS .gro file.

Parameters:

Name	Type	Description	Default
`filename`	`str`	Output file name without extension.	required
`box`	`ndarray`	`(3, 3)` box matrix (orthogonal only).	required
`natom`	`int`	Number of atoms.	required
`type_atom`	`array - like`	Atom type identifiers.	required
`coors`	`ndarray`	Cartesian coordinates for each atom.	required

Returns:

Type	Description
`None`	Writes `filename.gro` to disk.

Source code in m2dtools/other/tools_gro.py

def write_gro(filename, box, natom, type_atom, coors):
    """Write a GROMACS ``.gro`` file.

    Parameters
    ----------
    filename : str
        Output file name without extension.
    box : numpy.ndarray
        ``(3, 3)`` box matrix (orthogonal only).
    natom : int
        Number of atoms.
    type_atom : array-like
        Atom type identifiers.
    coors : numpy.ndarray
        Cartesian coordinates for each atom.

    Returns
    -------
    None
        Writes ``filename.gro`` to disk.
    """
    f = open('{}.gro'.format(filename), 'w')
    f.write('SiO2\n')
    f.write('{0:5d} \n'.format(natom))
    for i in range(natom):
        if i < 9999:
            f.write('{0:5d}SIO     {1:s}{2:5d}{3:8.3f}{4:8.3f}{5:8.3f}{6:8.4f}{7:8.4f}{8:8.4f}\n'.format(i+1, type_atom[i], i+1, coors[i, 0], coors[i, 1], coors[i, 2], 0, 0, 0))
        else:
            f.write('{0:5d}SIO     {1:s}{2:6d}{3:8.3f}{4:8.3f}{5:8.3f}{6:8.4f}{7:8.4f}{8:8.4f}\n'.format(i+1, type_atom[i], i+1, coors[i, 0], coors[i, 1], coors[i, 2], 0, 0, 0))
    f.write('{0:10.5f}{1:10.5f}{2:10.5f}'.format(box[0, 0], box[1, 1], box[2, 2]))  # only work for othorgonal boxes
    f.close()