Source code for sisl.io.siesta.binaries

# This Source Code Form is subject to the terms of the Mozilla Public
# License, v. 2.0. If a copy of the MPL was not distributed with this
# file, You can obtain one at https://mozilla.org/MPL/2.0/.
from numbers import Integral
from itertools import product
from collections import deque, namedtuple
import numpy as np
from numpy import pi

try:
    from . import _siesta
    found_module = True
except Exception as e:
    print(e)
    found_module = False

from ..sile import add_sile, SileError, SileWarning
from .sile import SileBinSiesta
from sisl._internal import set_module
from sisl.messages import info, warn, SislError

from ._help import *
import sisl._array as _a
from sisl import Geometry, Atom, Atoms, SuperCell, Grid, SparseCSR
from sisl import AtomicOrbital
from sisl.sparse import _ncol_to_indptr
from sisl.unit.siesta import unit_convert
from sisl.physics.sparse import SparseOrbitalBZ
from sisl.physics import Hamiltonian, DensityMatrix, EnergyDensityMatrix
from sisl.physics import BrillouinZone
from sisl.physics.overlap import Overlap
from sisl.physics.electron import EigenstateElectron


__all__ = ['tshsSileSiesta', 'onlysSileSiesta', 'tsdeSileSiesta']
__all__ += ['hsxSileSiesta', 'dmSileSiesta']
__all__ += ['wfsxSileSiesta']
__all__ += ['gridSileSiesta']
__all__ += ['tsgfSileSiesta']


_Bohr2Ang = unit_convert('Bohr', 'Ang')
_Ry2eV = unit_convert('Ry', 'eV')
_eV2Ry = unit_convert('eV', 'Ry')


def _toF(array, dtype, scale=None):
    if scale is None:
        return array.astype(dtype, order='F', copy=False)
    elif array.dtype == dtype and array.flags.f_contiguous:
        # no need to copy since the order is correct
        return array * scale

    # We have to handle cases
    out = np.empty_like(array, dtype, order='F')
    np.multiply(array, scale, out=out)
    return out


def _geometry_align(geom_b, geom_u, cls, method):
    """ Routine used to align two geometries

    There are a few twists in this since the fdf-reads will automatically
    try and pass a geometry from the output files.
    In cases where the *.ion* files are non-existing this will
    result in a twist.

    This routine will select and return a merged Geometry which
    fulfills the correct number of atoms and orbitals.

    However, if the input geometries have mis-matching number
    of atoms a SislError will be raised.

    Parameters
    ----------
    geom_b : Geometry from binary file
    geom_u : Geometry supplied by user

    Raises
    ------
    SislError
        if the geometries have non-equal atom count
    """
    if geom_b is None:
        return geom_u
    elif geom_u is None:
        return geom_b

    # Default to use the users geometry
    geom = geom_u

    is_copy = False
    def get_copy(geom, is_copy):
        if is_copy:
            return geom, True
        return geom.copy(), True

    if geom_b.na != geom.na:
        # we have no way of solving this issue...
        raise SileError(f"{cls.__name__}.{method} could not use the passed geometry as the "
                        f"of atoms is not consistent, user-atoms={geom_u.na}, file-atoms={geom_b.na}.")

    # Try and figure out what to do
    if not np.allclose(geom_b.xyz, geom.xyz):
        warn(f"{cls.__name__}.{method} has mismatched atomic coordinates, will copy geometry and use file XYZ.")
        geom, is_copy = get_copy(geom, is_copy)
        geom.xyz[:, :] = geom_b.xyz[:, :]
    if not np.allclose(geom_b.sc.cell, geom.sc.cell):
        warn(f"{cls.__name__}.{method} has non-equal lattice vectors, will copy geometry and use file lattice.")
        geom, is_copy = get_copy(geom, is_copy)
        geom.sc.cell[:, :] = geom_b.sc.cell[:, :]
    if not np.array_equal(geom_b.nsc, geom.nsc):
        warn(f"{cls.__name__}.{method} has non-equal number of supercells, will copy geometry and use file supercell count.")
        geom, is_copy = get_copy(geom, is_copy)
        geom.set_nsc(geom_b.nsc)

    # Now for the difficult part.
    # If there is a mismatch in the number of orbitals we will
    # prefer to use the user-supplied atomic species, but fill with
    # *random* orbitals
    if not np.array_equal(geom_b.atoms.orbitals, geom.atoms.orbitals):
        warn(f"{cls.__name__}.{method} has non-equal number of orbitals per atom, will correct with *empty* orbitals.")
        geom, is_copy = get_copy(geom, is_copy)

        # Now create a new atom specie with the correct number of orbitals
        norbs = geom_b.atoms.orbitals[:]
        atoms = Atoms([geom.atoms[i].copy(orbitals=[-1.] * norbs[i]) for i in range(geom.na)])
        geom._atoms = atoms

    return geom


@set_module("sisl.io.siesta")
class onlysSileSiesta(SileBinSiesta):
    """ Geometry and overlap matrix """

[docs] def read_supercell(self): """ Returns a SuperCell object from a TranSiesta file """ n_s = _siesta.read_tshs_sizes(self.file)[3] self._fortran_check('read_supercell', 'could not read sizes.') arr = _siesta.read_tshs_cell(self.file, n_s) self._fortran_check('read_supercell', 'could not read cell.') nsc = np.array(arr[0], np.int32) # We have to transpose since the data is read *as-is* # The cell in fortran files are (:, A1) # after reading this is still obeyed (regardless of order) # So we transpose to get it C-like # Note that care must be taken for the different data-structures # In particular not all data needs to be transposed (sparse H and S) cell = arr[1].T * _Bohr2Ang return SuperCell(cell, nsc=nsc)
[docs] def read_geometry(self, geometry=None): """ Returns Geometry object from a TranSiesta file """ # Read supercell sc = self.read_supercell() na = _siesta.read_tshs_sizes(self.file)[1] self._fortran_check('read_geometry', 'could not read sizes.') arr = _siesta.read_tshs_geom(self.file, na) self._fortran_check('read_geometry', 'could not read geometry.') # see onlysSileSiesta.read_supercell for .T xyz = arr[0].T * _Bohr2Ang lasto = arr[1] # Since the TSHS file does not contain species information # and/or other stuff we *can* reuse an existing # geometry which contains the correct atomic numbers etc. orbs = np.diff(lasto) if geometry is None: # Create all different atoms... # The TSHS file does not contain the # atomic numbers, so we will just # create them individually # Get unique orbitals uorb = np.unique(orbs) # Create atoms atoms = [] for Z, orb in enumerate(uorb): atoms.append(Atom(Z+1, [-1] * orb)) def get_atom(atoms, orbs): for atom in atoms: if atom.no == orbs: return atom atom = [] for orb in orbs: atom.append(get_atom(atoms, orb)) else: # Create a new geometry with the correct atomic numbers atom = [] for ia, no in zip(geometry, orbs): a = geometry.atoms[ia] if a.no == no: atom.append(a) else: # correct atom atom.append(a.__class__(a.Z, [-1. for io in range(no)], mass=a.mass, tag=a.tag)) # Create and return geometry object return Geometry(xyz, atom, sc=sc)
[docs] def read_overlap(self, **kwargs): """ Returns the overlap matrix from the TranSiesta file """ tshs_g = self.read_geometry() geom = _geometry_align(tshs_g, kwargs.get('geometry', tshs_g), self.__class__, 'read_overlap') # read the sizes used... sizes = _siesta.read_tshs_sizes(self.file) self._fortran_check('read_overlap', 'could not read sizes.') # see onlysSileSiesta.read_supercell for .T isc = _siesta.read_tshs_cell(self.file, sizes[3])[2].T self._fortran_check('read_overlap', 'could not read cell.') no = sizes[2] nnz = sizes[4] ncol, col, dS = _siesta.read_tshs_s(self.file, no, nnz) self._fortran_check('read_overlap', 'could not read overlap matrix.') # Create the Hamiltonian container S = Overlap(geom, nnzpr=1) # Create the new sparse matrix S._csr.ncol = ncol.astype(np.int32, copy=False) S._csr.ptr = _ncol_to_indptr(ncol) # Correct fortran indices S._csr.col = col.astype(np.int32, copy=False) - 1 S._csr._nnz = len(col) S._csr._D = _a.emptyd([nnz, 1]) S._csr._D[:, 0] = dS[:] # Convert to sisl supercell # equivalent as _csr_from_siesta with explicit isc from file _csr_from_sc_off(S.geometry, isc, S._csr) # In siesta the matrix layout is written in CSC format # due to fortran indexing, this means that we need to transpose # to get it to correct layout. return S.transpose(sort=kwargs.get("sort", True))
[docs] def read_fermi_level(self): r""" Query the Fermi-level contained in the file Returns ------- Ef : fermi-level of the system """ Ef = _siesta.read_tshs_ef(self.file) * _Ry2eV self._fortran_check('read_fermi_level', 'could not read fermi-level.') return Ef
@set_module("sisl.io.siesta") class tshsSileSiesta(onlysSileSiesta): """ Geometry, Hamiltonian and overlap matrix file """
[docs] def read_hamiltonian(self, **kwargs): """ Returns the electronic structure from the siesta.TSHS file """ tshs_g = self.read_geometry() geom = _geometry_align(tshs_g, kwargs.get('geometry', tshs_g), self.__class__, 'read_hamiltonian') # read the sizes used... sizes = _siesta.read_tshs_sizes(self.file) self._fortran_check('read_hamiltonian', 'could not read sizes.') # see onlysSileSiesta.read_supercell for .T isc = _siesta.read_tshs_cell(self.file, sizes[3])[2].T self._fortran_check('read_hamiltonian', 'could not read cell.') spin = sizes[0] no = sizes[2] nnz = sizes[4] ncol, col, dH, dS = _siesta.read_tshs_hs(self.file, spin, no, nnz) self._fortran_check('read_hamiltonian', 'could not read Hamiltonian and overlap matrix.') # Check whether it is an orthogonal basis set orthogonal = np.abs(dS).sum() == geom.no # Create the Hamiltonian container H = Hamiltonian(geom, spin, nnzpr=1, orthogonal=orthogonal) # Create the new sparse matrix H._csr.ncol = ncol.astype(np.int32, copy=False) H._csr.ptr = _ncol_to_indptr(ncol) # Correct fortran indices H._csr.col = col.astype(np.int32, copy=False) - 1 H._csr._nnz = len(col) if orthogonal: H._csr._D = _a.emptyd([nnz, spin]) H._csr._D[:, :] = dH[:, :] * _Ry2eV else: H._csr._D = _a.emptyd([nnz, spin+1]) H._csr._D[:, :spin] = dH[:, :] * _Ry2eV H._csr._D[:, spin] = dS[:] _mat_spin_convert(H) # Convert to sisl supercell # equivalent as _csr_from_siesta with explicit isc from file _csr_from_sc_off(H.geometry, isc, H._csr) # Find all indices where dS == 1 (remember col is in fortran indices) idx = col[np.isclose(dS, 1.).nonzero()[0]] if np.any(idx > no): print(f'Number of orbitals: {no}') print(idx) raise SileError(f'{self!s}.read_hamiltonian could not assert ' 'the supercell connections in the primary unit-cell.') # see onlysSileSiesta.read_overlap for .transpose() # For H, DM and EDM we also need to Hermitian conjugate it. return H.transpose(spin=False, sort=kwargs.get("sort", True))
[docs] def write_hamiltonian(self, H, **kwargs): """ Writes the Hamiltonian to a siesta.TSHS file """ # we sort below, so no need to do it here # see onlysSileSiesta.read_overlap for .transpose() csr = H.transpose(spin=False, sort=False)._csr if csr.nnz == 0: raise SileError(f'{self!s}.write_hamiltonian cannot write ' 'a zero element sparse matrix!') # Convert to siesta CSR _csr_to_siesta(H.geometry, csr) csr.finalize(sort=kwargs.get("sort", True)) _mat_spin_convert(csr, H.spin) # Extract the data to pass to the fortran routine cell = H.geometry.cell xyz = H.geometry.xyz # Get H and S if H.orthogonal: h = csr._D s = csr.diags(1., dim=1) # Ensure all data is correctly formatted (i.e. have the same sparsity pattern) s.align(csr) s.finalize(sort=kwargs.get("sort", True)) if s.nnz != len(h): raise SislError('The diagonal elements of your orthogonal Hamiltonian ' 'have not been defined, this is a requirement.') s = s._D[:, 0] else: h = csr._D[:, :H.S_idx] s = csr._D[:, H.S_idx] # Get shorter variants nsc = H.geometry.nsc[:].astype(np.int32) isc = _siesta.siesta_sc_off(*nsc) # see onlysSileSiesta.read_supercell for .T _siesta.write_tshs_hs(self.file, nsc[0], nsc[1], nsc[2], cell.T / _Bohr2Ang, xyz.T / _Bohr2Ang, H.geometry.firsto, csr.ncol, csr.col + 1, _toF(h, np.float64, _eV2Ry), _toF(s, np.float64), isc) self._fortran_check('write_hamiltonian', 'could not write Hamiltonian and overlap matrix.')
@set_module("sisl.io.siesta") class dmSileSiesta(SileBinSiesta): """ Density matrix file """
[docs] def read_density_matrix(self, **kwargs): """ Returns the density matrix from the siesta.DM file """ # Now read the sizes used... spin, no, nsc, nnz = _siesta.read_dm_sizes(self.file) self._fortran_check('read_density_matrix', 'could not read density matrix sizes.') ncol, col, dDM = _siesta.read_dm(self.file, spin, no, nsc, nnz) self._fortran_check('read_density_matrix', 'could not read density matrix.') # Try and immediately attach a geometry geom = kwargs.get('geometry', kwargs.get('geom', None)) if geom is None: # We truly, have no clue, # Just generate a boxed system xyz = [[x, 0, 0] for x in range(no)] sc = SuperCell([no, 1, 1], nsc=nsc) geom = Geometry(xyz, Atom(1), sc=sc) if nsc[0] != 0 and np.any(geom.nsc != nsc): # We have to update the number of supercells! geom.set_nsc(nsc) if geom.no != no: raise SileError(f'{self!s}.read_density_matrix could not use the ' 'passed geometry as the number of atoms or orbitals is ' 'inconsistent with DM file.') # Create the density matrix container DM = DensityMatrix(geom, spin, nnzpr=1, dtype=np.float64, orthogonal=False) # Create the new sparse matrix DM._csr.ncol = ncol.astype(np.int32, copy=False) DM._csr.ptr = _ncol_to_indptr(ncol) # Correct fortran indices DM._csr.col = col.astype(np.int32, copy=False) - 1 DM._csr._nnz = len(col) DM._csr._D = _a.emptyd([nnz, spin+1]) DM._csr._D[:, :spin] = dDM[:, :] # DM file does not contain overlap matrix... so neglect it for now. DM._csr._D[:, spin] = 0. _mat_spin_convert(DM) # Convert the supercells to sisl supercells if nsc[0] != 0 or geom.no_s >= col.max(): _csr_from_siesta(geom, DM._csr) else: warn(f'{self!s}.read_density_matrix may result in a wrong sparse pattern!') return DM.transpose(spin=False, sort=kwargs.get("sort", True))
[docs] def write_density_matrix(self, DM, **kwargs): """ Writes the density matrix to a siesta.DM file """ csr = DM.transpose(spin=False, sort=False)._csr # This ensures that we don't have any *empty* elements if csr.nnz == 0: raise SileError(f'{self!s}.write_density_matrix cannot write ' 'a zero element sparse matrix!') _csr_to_siesta(DM.geometry, csr) # We do not really need to sort this one, but we do for consistency # of the interface. csr.finalize(sort=kwargs.get("sort", True)) _mat_spin_convert(csr, DM.spin) # Get DM if DM.orthogonal: dm = csr._D else: dm = csr._D[:, :DM.S_idx] # Ensure shapes (say if only 1 spin) dm.shape = (-1, len(DM.spin)) nsc = DM.geometry.sc.nsc.astype(np.int32) _siesta.write_dm(self.file, nsc, csr.ncol, csr.col + 1, _toF(dm, np.float64)) self._fortran_check('write_density_matrix', 'could not write density matrix.')
@set_module("sisl.io.siesta") class tsdeSileSiesta(dmSileSiesta): """ Non-equilibrium density matrix and energy density matrix file """
[docs] def read_energy_density_matrix(self, **kwargs): """ Returns the energy density matrix from the siesta.DM file """ # Now read the sizes used... spin, no, nsc, nnz = _siesta.read_tsde_sizes(self.file) self._fortran_check('read_energy_density_matrix', 'could not read energy density matrix sizes.') ncol, col, dEDM = _siesta.read_tsde_edm(self.file, spin, no, nsc, nnz) self._fortran_check('read_energy_density_matrix', 'could not read energy density matrix.') # Try and immediately attach a geometry geom = kwargs.get('geometry', kwargs.get('geom', None)) if geom is None: # We truly, have no clue, # Just generate a boxed system xyz = [[x, 0, 0] for x in range(no)] sc = SuperCell([no, 1, 1], nsc=nsc) geom = Geometry(xyz, Atom(1), sc=sc) if nsc[0] != 0 and np.any(geom.nsc != nsc): # We have to update the number of supercells! geom.set_nsc(nsc) if geom.no != no: raise SileError(f'{self!s}.read_energy_density_matrix could ' 'not use the passed geometry as the number of atoms or orbitals ' 'is inconsistent with DM file.') # Create the energy density matrix container EDM = EnergyDensityMatrix(geom, spin, nnzpr=1, dtype=np.float64, orthogonal=False) # Create the new sparse matrix EDM._csr.ncol = ncol.astype(np.int32, copy=False) EDM._csr.ptr = _ncol_to_indptr(ncol) # Correct fortran indices EDM._csr.col = col.astype(np.int32, copy=False) - 1 EDM._csr._nnz = len(col) EDM._csr._D = _a.emptyd([nnz, spin+1]) EDM._csr._D[:, :spin] = dEDM[:, :] * _Ry2eV # EDM file does not contain overlap matrix... so neglect it for now. EDM._csr._D[:, spin] = 0. _mat_spin_convert(EDM) # Convert the supercells to sisl supercells if nsc[0] != 0 or geom.no_s >= col.max(): _csr_from_siesta(geom, EDM._csr) else: warn(f'{self!s}.read_energy_density_matrix may result in a wrong sparse pattern!') return EDM.transpose(spin=False, sort=kwargs.get("sort", True))
[docs] def read_fermi_level(self): r""" Query the Fermi-level contained in the file Returns ------- Ef : fermi-level of the system """ Ef = _siesta.read_tsde_ef(self.file) * _Ry2eV self._fortran_check('read_fermi_level', 'could not read fermi-level.') return Ef
[docs] def write_density_matrices(self, DM, EDM, Ef=0., **kwargs): r""" Writes the density matrix to a siesta.DM file Parameters ---------- DM : DensityMatrix density matrix to write to the file EDM : EnergyDensityMatrix energy density matrix to write to the file Ef : float, optional fermi-level to be contained """ DMcsr = DM.transpose(spin=False, sort=False)._csr EDMcsr = EDM.transpose(spin=False, sort=False)._csr DMcsr.align(EDMcsr) EDMcsr.align(DMcsr) if DMcsr.nnz == 0: raise SileError(f'{self!s}.write_density_matrices cannot write ' 'a zero element sparse matrix!') _csr_to_siesta(DM.geometry, DMcsr) _csr_to_siesta(DM.geometry, EDMcsr) sort = kwargs.get("sort", True) DMcsr.finalize(sort=sort) EDMcsr.finalize(sort=sort) _mat_spin_convert(DMcsr, DM.spin) _mat_spin_convert(EDMcsr, EDM.spin) # Ensure everything is correct if not (np.allclose(DMcsr.ncol, EDMcsr.ncol) and np.allclose(DMcsr.col, EDMcsr.col)): raise ValueError(f'{self!s}.write_density_matrices got non compatible ' 'DM and EDM matrices.') if DM.orthogonal: dm = DMcsr._D else: dm = DMcsr._D[:, :DM.S_idx] if EDM.orthogonal: edm = EDMcsr._D else: edm = EDMcsr._D[:, :EDM.S_idx] nsc = DM.geometry.sc.nsc.astype(np.int32) _siesta.write_tsde_dm_edm(self.file, nsc, DMcsr.ncol, DMcsr.col + 1, _toF(dm, np.float64), _toF(edm, np.float64, _eV2Ry), Ef * _eV2Ry) self._fortran_check('write_density_matrices', 'could not write DM + EDM matrices.')
@set_module("sisl.io.siesta") class hsxSileSiesta(SileBinSiesta): """ Hamiltonian and overlap matrix file This file does not contain all information regarding the system. To ensure no errors are being raised one should pass a `Geometry` with correct number of atoms and correct number of supercells. The number of orbitals will be updated in the returned matrices geometry. >>> hsx = hsxSileSiesta("siesta.HSX") >>> HS = hsx.read_hamiltonian() # may fail >>> HS = hsx.read_hamiltonian(geometry=<>) # should run correctly if above satisfied Users are adviced to use the `tshsSileSiesta` instead since that correctly contains all information. """ def _xij2system(self, xij, geometry=None): """ Create a new geometry with *correct* nsc and somewhat correct xyz Parameters ---------- xij : SparseCSR orbital distances geometry : Geometry, optional passed geometry """ def get_geom_handle(xij): atoms = self._read_atoms() if not atoms is None: return Geometry(np.zeros([len(atoms), 3]), atoms) N = len(xij) # convert csr to dok format row = (xij.ncol > 0).nonzero()[0] # Now we have [0 0 0 0 1 1 1 1 2 2 ... no-1 no-1] row = np.repeat(row, xij.ncol[row]) col = xij.col # Parse xij to correct geometry # first figure out all zeros (i.e. self-atom-orbitals) idx0 = np.isclose(np.fabs(xij._D).sum(axis=1), 0.).nonzero()[0] row0 = row[idx0] # convert row0 and col0 to a first attempt of "atomization" atoms = [] for r in range(N): idx0r = (row0 == r).nonzero()[0] row0r = row0[idx0r] # although xij == 0, we just do % to ensure unit-cell orbs col0r = col[idx0[idx0r]] % N if np.all(col0r >= r): # we have a new atom atoms.append(set(col0r)) else: atoms[-1].update(set(col0r)) # convert list of orbitals to lists def conv(a): a = list(a) a.sort() return a atoms = [list(a) for a in atoms] if sum(map(len, atoms)) != len(xij): raise ValueError(f"{self.__class__.__name__} could not determine correct " "number of orbitals.") atms = Atoms(Atom('H', [-1. for _ in atoms[0]])) for orbs in atoms[1:]: atms.append(Atom('H', [-1. for _ in orbs])) return Geometry(np.zeros([len(atoms), 3]), atms) geom_handle = get_geom_handle(xij) def convert_to_atom(geom, xij): # o2a does not check for correct super-cell index n_s = xij.shape[1] // xij.shape[0] atm_s = geom.o2a(np.arange(xij.shape[1])) # convert csr to dok format row = (xij.ncol > 0).nonzero()[0] row = np.repeat(row, xij.ncol[row]) col = xij.col arow = atm_s[row] acol = atm_s[col] del atm_s, row, col idx = np.lexsort((acol, arow)) arow = arow[idx] acol = acol[idx] xij = xij._D[idx] del idx # Now figure out if xij is consistent duplicates = np.logical_and(np.diff(acol) == 0, np.diff(arow) == 0).nonzero()[0] if duplicates.size > 0: if not np.allclose(xij[duplicates+1] - xij[duplicates], 0.): raise ValueError(f"{self.__class__.__name__} converting xij(orb) -> xij(atom) went wrong. " "This may happen if your coordinates are not inside the unitcell, please pass " "a usable geometry.") # remove duplicates to create new matrix arow = np.delete(arow, duplicates) acol = np.delete(acol, duplicates) xij = np.delete(xij, duplicates, axis=0) # Create a new sparse matrix # Create the new index pointer indptr = np.insert(np.array([0, len(xij)], np.int32), 1, (np.diff(arow) != 0).nonzero()[0] + 1) assert len(indptr) == geom.na + 1 return SparseCSR((xij, acol, indptr), shape=(geom.na, geom.na * n_s)) def coord_from_xij(xij): # first atom is at 0, 0, 0 na = len(xij) xyz = _a.zerosd([na, 3]) xyz[0] = [0, 0, 0] mark = _a.zerosi(na) mark[0] = 1 run_atoms = deque([0]) while len(run_atoms) > 0: atm = run_atoms.popleft() xyz_atm = xyz[atm].reshape(1, 3) neighbours = xij.edges(atm, exclude=atm) neighbours = neighbours[neighbours < na] # update those that haven't been calculated idx = mark[neighbours] == 0 neigh_idx = neighbours[idx] if len(neigh_idx) == 0: continue xyz[neigh_idx, :] = xij[atm, neigh_idx] - xyz_atm mark[neigh_idx] = 1 # add more atoms to be processed, since we have *mark* # we will only run every atom once run_atoms.extend(neigh_idx.tolist()) # check that everything is correct if (~idx).sum() > 0: neg_neighbours = neighbours[~idx] if not np.allclose(xyz[neg_neighbours, :], xij[atm, neg_neighbours] - xyz_atm): raise ValueError(f"{self.__class__.__name__} xij(orb) -> xyz did not " f"find same coordinates for different connections") if mark.sum() != na: raise ValueError(f"{self.__class__.__name__} xij(orb) -> Geometry does not " f"have a fully connected geometry. It is impossible to create relative coordinates") return xyz def sc_from_xij(xij, xyz): na = xij.shape[0] n_s = xij.shape[1] // xij.shape[0] if n_s == 1: # easy!! return SuperCell(xyz.max(axis=0) - xyz.min(axis=0) + 10., nsc=[1] * 3) sc_off = _a.zerosd([n_s, 3]) mark = _a.zerosi(n_s) mark[0] = 1 for atm in range(na): neighbours = xij.edges(atm, exclude=atm) uneighbours = neighbours % na neighbour_isc = neighbours // na # get offset in terms of unit-cell off = xij[atm, neighbours] - (xyz[uneighbours] - xyz[atm].reshape(1, 3)) idx = mark[neighbour_isc] == 0 if not np.allclose(off[~idx], sc_off[neighbour_isc[~idx]]): raise ValueError(f"{self.__class__.__name__} xij(orb) -> xyz did not " f"find same supercell offsets for different connections") if idx.sum() == 0: continue for idx in idx.nonzero()[0]: nidx = neighbour_isc[idx] if mark[nidx] == 0: mark[nidx] = 1 sc_off[nidx] = off[idx] elif not np.allclose(sc_off[nidx], off[idx]): raise ValueError(f"{self.__class__.__name__} xij(orb) -> xyz did not " f"find same supercell offsets for different connections") # We know that siesta returns isc # for iz in [0, 1, 2, 3, -3, -2, -1]: # for iy in [0, 1, 2, -2, -1]: # for ix in [0, 1, -1]: # every block we find a half monotonically increasing vector additions # Note the first is always [0, 0, 0] # So our best chance is to *guess* the first nsc # then reshape, then guess, then reshape, then guess :) sc_diff = np.diff(sc_off, axis=0) def get_nsc(sc_off): """ Determine nsc depending on the axis """ # correct the offsets ndim = sc_off.ndim if sc_off.shape[0] == 1: return 1 # always select the 2nd one since that contains the offset # for the first isc [1, 0, 0] or [0, 1, 0] or [0, 0, 1] sc_dir = sc_off[(1, ) + np.index_exp[0] * (ndim - 2)].reshape(1, 3) norm2_sc_dir = (sc_dir ** 2).sum() # figure out the maximum integer part # we select 0 indices for all already determined lattice # vectors since we know the first one is [0, 0, 0] idx = np.index_exp[:] + np.index_exp[0] * (ndim - 2) projection = (sc_off[idx] * sc_dir).sum(-1) / norm2_sc_dir iprojection = np.rint(projection) # reduce, find 0 idx_zero = np.isclose(iprojection, 0, atol=1e-5).nonzero()[0] if idx_zero.size <= 1: return 1 # only take those values that are continuous # we *must* have some supercell connections idx_max = idx_zero[1] # find where they are close # since there may be *many* zeros (non-coupling elements) # we first have to cut off anything that is not integer if np.allclose(projection[:idx_max], iprojection[:idx_max], atol=1e-5): return idx_max raise ValueError(f"Could not determine nsc from coordinates") nsc = _a.onesi(3) nsc[0] = get_nsc(sc_off) sc_off = sc_off.reshape(-1, nsc[0], 3) nsc[1] = get_nsc(sc_off) sc_off = sc_off.reshape(-1, nsc[1], nsc[0], 3) nsc[2] = sc_off.shape[0] # now determine cell parameters if all(nsc > 1): cell = _a.arrayd([sc_off[0, 0, 1], sc_off[0, 1, 0], sc_off[1, 0, 0]]) else: # we will never have all(nsc == 1) since that is # taken care of at the start # this gets a bit tricky, since we don't know one of the # lattice vectors cell = _a.zerosd([3, 3]) i = 0 for idx, isc in enumerate(nsc): if isc > 1: sl = [0, 0, 0] sl[2 - idx] = 1 cell[i] = sc_off[tuple(sl)] i += 1 # figure out the last vectors # We'll just use Cartesian coordinates while i < 3: # this means we don't have any supercell connections # along at least 1 other lattice vector. lcell = np.fabs(cell).sum(0) # figure out which Cartesian direction we are *missing* cart_dir = np.argmin(lcell) cell[i, cart_dir] = xyz[:, cart_dir].max() - xyz[:, cart_dir].min() + 10. i += 1 return SuperCell(cell, nsc) # now we have all orbitals, ensure compatibility with passed geometry if geometry is None: atm_xij = convert_to_atom(geom_handle, xij) xyz = coord_from_xij(atm_xij) sc = sc_from_xij(atm_xij, xyz) geometry = Geometry(xyz, geom_handle.atoms, sc) # Move coordinates into unit-cell geometry.xyz[:, :] = (geometry.fxyz % 1.) @ geometry.cell else: if geometry.n_s != xij.shape[1] // xij.shape[0]: atm_xij = convert_to_atom(geom_handle, xij) sc = sc_from_xij(atm_xij, coord_from_xij(atm_xij)) geometry.set_nsc(sc.nsc) def conv(orbs, atm): if len(orbs) == len(atm): return atm return atm.copy(orbitals=[-1. for _ in orbs]) atms = Atoms(list(map(conv, geom_handle.atoms, geometry.atoms))) if len(atms) != len(geometry): raise ValueError(f"{self.__class__.__name__} passed geometry for reading " "sparse matrix does not contain same number of atoms!") geometry = geometry.copy() # TODO check that geometry and xyz are the same! geometry._atoms = atms return geometry def _read_atoms(self, **kwargs): """ Reads basis set and geometry information from the HSX file """ # Now read the sizes used... no, na, nspecies = _siesta.read_hsx_specie_sizes(self.file) self._fortran_check('read_geometry', 'could not read specie sizes.') # Read specie information labels, val_q, norbs, isa = _siesta.read_hsx_species(self.file, nspecies, no, na) # convert to proper string labels = labels.T.reshape(nspecies, -1) labels = labels.view(f"S{labels.shape[1]}") labels = list(map(lambda s: b''.join(s).decode('utf-8').strip(), labels.tolist()) ) self._fortran_check('read_geometry', 'could not read species.') # to python index isa -= 1 from sisl.atom import _ptbl # try and convert labels into symbols # We do this by: # 1. label -> symbol # 2. label[:2] -> symbol # 3. label[:1] -> symbol symbols = [] lbls = [] for label in labels: lbls.append(label) try: symbol = _ptbl.Z_label(label) symbols.append(symbol) continue except: pass try: symbol = _ptbl.Z_label(label[:2]) symbols.append(symbol) continue except: pass try: symbol = _ptbl.Z_label(label[:1]) symbols.append(symbol) continue except: # we have no clue, assign -1 symbols.append(-1) # Read in orbital information atoms = [] for ispecie in range(nspecies): n_l_zeta = _siesta.read_hsx_specie(self.file, ispecie+1, norbs[ispecie]) self._fortran_check('read_geometry', f'could not read specie {ispecie}.') # create orbital # no shell will have l>5, so m=10 should be more than enough m = 10 orbs = [] for n, l, zeta in zip(*n_l_zeta): # manual loop on m quantum numbers if m > l: m = -l orbs.append(AtomicOrbital(n=n, l=l, m=m, zeta=zeta, R=-1.)) m += 1 # now create atom atoms.append(Atom(symbols[ispecie], orbs, tag=lbls[ispecie])) # now read in xij to retrieve atomic positions Gamma, spin, no, no_s, nnz = _siesta.read_hsx_sizes(self.file) self._fortran_check('read_geometry', 'could not read matrix sizes.') ncol, col, _, dxij = _siesta.read_hsx_sx(self.file, Gamma, spin, no, no_s, nnz) dxij = dxij.T * _Bohr2Ang col -= 1 self._fortran_check('read_geometry', 'could not read xij matrix.') # now create atoms object atoms = Atoms([atoms[ia] for ia in isa]) return atoms
[docs] def read_hamiltonian(self, **kwargs): """ Returns the electronic structure from the siesta.TSHS file """ # Now read the sizes used... Gamma, spin, no, no_s, nnz = _siesta.read_hsx_sizes(self.file) self._fortran_check('read_hamiltonian', 'could not read Hamiltonian sizes.') ncol, col, dH, dS, dxij = _siesta.read_hsx_hsx(self.file, Gamma, spin, no, no_s, nnz) dxij = dxij.T * _Bohr2Ang col -= 1 self._fortran_check('read_hamiltonian', 'could not read Hamiltonian.') ptr = _ncol_to_indptr(ncol) xij = SparseCSR((dxij, col, ptr), shape=(no, no_s)) geom = self._xij2system(xij, kwargs.get('geometry', kwargs.get('geom', None))) if geom.no != no or geom.no_s != no_s: raise SileError(f"{str(self)}.read_hamiltonian could not use the " "passed geometry as the number of atoms or orbitals is " "inconsistent with HSX file.") # Create the Hamiltonian container H = Hamiltonian(geom, spin, nnzpr=1, dtype=np.float32, orthogonal=False) # Create the new sparse matrix H._csr.ncol = ncol.astype(np.int32, copy=False) H._csr.ptr = ptr # Correct fortran indices H._csr.col = col.astype(np.int32, copy=False) H._csr._nnz = len(col) H._csr._D = _a.emptyf([nnz, spin+1]) H._csr._D[:, :spin] = dH[:, :] * _Ry2eV H._csr._D[:, spin] = dS[:] _mat_spin_convert(H) # Convert the supercells to sisl supercells if no_s // no == np.product(geom.nsc): _csr_from_siesta(geom, H._csr) return H.transpose(spin=False, sort=kwargs.get("sort", True))
[docs] def read_overlap(self, **kwargs): """ Returns the overlap matrix from the siesta.HSX file """ # Now read the sizes used... Gamma, spin, no, no_s, nnz = _siesta.read_hsx_sizes(self.file) self._fortran_check('read_overlap', 'could not read overlap matrix sizes.') ncol, col, dS, dxij = _siesta.read_hsx_sx(self.file, Gamma, spin, no, no_s, nnz) dxij = dxij.T * _Bohr2Ang col -= 1 self._fortran_check('read_overlap', 'could not read overlap matrix.') ptr = _ncol_to_indptr(ncol) xij = SparseCSR((dxij, col, ptr), shape=(no, no_s)) geom = self._xij2system(xij, kwargs.get('geometry', kwargs.get('geom', None))) if geom.no != no or geom.no_s != no_s: raise SileError(f"{str(self)}.read_overlap could not use the " "passed geometry as the number of atoms or orbitals is " "inconsistent with HSX file.") # Create the Hamiltonian container S = Overlap(geom, nnzpr=1) # Create the new sparse matrix S._csr.ncol = ncol.astype(np.int32, copy=False) S._csr.ptr = _ncol_to_indptr(ncol) # Correct fortran indices S._csr.col = col.astype(np.int32, copy=False) S._csr._nnz = len(col) S._csr._D = _a.emptyf([nnz, 1]) S._csr._D[:, 0] = dS[:] # Convert the supercells to sisl supercells if no_s // no == np.product(geom.nsc): _csr_from_siesta(geom, S._csr) # not really necessary with Hermitian transposing, but for consistency return S.transpose(sort=kwargs.get("sort", True))
@set_module("sisl.io.siesta") class wfsxSileSiesta(SileBinSiesta): r""" Binary WFSX file reader for Siesta The WFSX file assumes that users initialize the object with a `parent` argument (or one of the other geometry related objects as shown below). The `parent` argument is necessary to convert WFSX k-points from 1/Ang to reduced coordinates. When returning `EigenstateElectron` objects the parent of these objects are the equivalent of the `parent` argument upon initialization. Therefore please remember to pass a correct `parent`. Parameters ---------- parent : obj, optional a parent may contain a geometry, and/or a supercell geometry : Geometry, optional a geometry contains a cell with corresponding lattice vectors used to convert k [1/Ang] -> [b] sc : SuperCell, optional a supercell contains the lattice vectors to convert k """ def _setup(self, *args, **kwargs): """ Simple setup that needs to be overwritten All _read_next_* methods expect the fortran file unit to be handled and that the position in the file is correct. """ super()._setup(*args, **kwargs) # default sc sc = None # In case the instantiation was called with wfsxSileSiesta("path", geometry=geometry) parent = kwargs.get("parent") if parent is None: geometry = None elif isinstance(parent, Geometry): geometry = parent elif isinstance(parent, SuperCell): sc = parent else: geometry = parent.geometry geometry = kwargs.get("geometry", geometry) if geometry is not None and sc is None: sc = geometry.sc sc = kwargs.get("sc", sc) if sc is None and geometry is not None: raise ValueError(f"{self.__class__.__name__}(geometry=Geometry, sc=None) is not an allowed argument combination.") if parent is None: parent = geometry if parent is None: parent = sc self._parent = parent self._geometry = geometry self._sc = sc if self._parent is None and self._geometry is None and self._sc is None: def conv(k): if not np.allclose(k, 0.): warn(f"{self.__class__.__name__} cannot convert stored k-points from 1/Ang to reduced coordinates. Please ensure 'parent=Hamiltonian', 'geometry=Geometry', or 'sc=SuperCell' to ensure reduced k") return k / _Bohr2Ang else: def conv(k): return (k @ sc.cell.T) / (2 * pi * _Bohr2Ang) self._convert_k = conv def _open_wfsx(self, mode, rewind=False): """Open the file unit for the WFSX file. Here we also initialize some variables to keep track of the state of the read. """ self._fortran_open(mode, rewind=rewind) # Here we initialize the variables that will keep track of the state of the read. # The process for identification is done on this basis: # _ik is the current (Python) index for the k-point to be read # _ispin is the current (Python) index for the spin-index to be read (only has meaning for a spin-polarized # WFSX files) # _state is: # -1 : the file-descriptor has just been opened (i.e. in front of header) # 0 : it means that the file-descriptor is in front of basis information # 1 : it means that the file-descriptor is in front of k point information # 2 : it means that the file-descriptor is in front of k point WFSX values # self._state = -1 self._ispin = 0 self._ik = 0 def _close_wfsx(self): """Close the file unit for the WFSX file. We clean the variables used to keep track of read state. """ self._fortran_close() # Clean variables del self._state del self._ik del self._ispin try: del self._sizes except: pass try: del self._basis except: pass try: del self._funcs except: pass def _setup_parsing(self, close=True, skip_basis=True): """Gets all the things needed to parse the wfsx file. Parameters ----------- close: bool, optional Whether the file unit should be closed afterwards. skip_basis : bool, optional whether to also read the basis or not """ self._open_wfsx('r') # Read the sizes relevant to the file. # We also read whether there's only gamma point information or there are multiple points self._sizes = self._read_next_sizes(skip_basis=skip_basis) if not skip_basis: self._basis = self._read_next_basis() # Get the functions that should be used to parse state values. if self._sizes.nspin in (4, 8): # We will have twice as many coefficients. func_index = 4 elif self._sizes.Gamma: # State values will be in double precision floats func_index = 1 else: # State values will be in double precision complex func_index = 2 Funcs = namedtuple("WFSXReads", ["read_index", "read_next"]) self._funcs = Funcs( getattr(_siesta, f"read_wfsx_index_{func_index}"), getattr(_siesta, f"read_wfsx_next_{func_index}") ) if close: self._close_wfsx() def _read_next_sizes(self, skip_basis=False): """Reads the sizes if they are the next thing to be read. Parameters ----------- skip_basis: boolean, optional Whether this method should also skip over the basis information. Returns ------- namedtuple : - 'nspin': int. Number of spin components. - 'no_u': int. Number of orbitals in the unit cell. - 'nk': int. Number of k points in the file. - 'Gamma': bool. Whether the file contains only the gamma point. """ # Check that we are in the right position in the file if self._state != -1: raise SileError(f"We are not in a position to read the sizes. State is: {self._state}") # Read the sizes that we can find in the WFSX file Sizes = namedtuple("Sizes", ["nspin", "no_u", "nk", "Gamma"]) sizes = _siesta.read_wfsx_next_sizes(self._iu, skip_basis) # Inform that we are now in front of k point information self._state = 1 if skip_basis else 0 # Check that everything went fine self._fortran_check('_read_sizes', "could not read sizes") return Sizes(*sizes) def _read_next_basis(self): """Reads the basis if it is the next thing to be read. Returns ------- Atoms: the basis read. """ # Check that we are in the right position in the file if self._state != 0: raise SileError(f"We are not in a position to read the basis. State is: {self._state}") # Read the basis information that we can find in the WFSX file basis_info = _siesta.read_wfsx_next_basis(self._iu, self._sizes.no_u) # Inform that we are now in front of k point information self._state = 1 # Check that everything went fine self._fortran_check('_read_basis', "could not read basis information") # Convert the information to a dict so that code is easier to follow. basis_info = dict(zip(('atom_indices', 'atom_labels', 'orb_index_atom', 'orb_n', 'orb_symmetry'), basis_info)) # Sanitize the string information for char_key in ("atom_labels", "orb_symmetry"): basis_info[char_key] = np.array(["".join(label).rstrip() for label in basis_info[char_key].astype(str)]) # Find out the unique atom indices unique_ats = np.unique(basis_info["atom_indices"]) def _get_atom_object(at): """Given an atom index, generates an Atom object with all the information we have about it""" atom_orbs = np.where(basis_info["atom_indices"] == at)[0] at_label = basis_info["atom_labels"][atom_orbs[0]] orbitals = [ AtomicOrbital(f"{n}{symmetry}") for n, symmetry in zip(basis_info["orb_n"][atom_orbs], basis_info["orb_symmetry"][atom_orbs]) ] return Atom(at_label, orbitals=orbitals) # Generate the Atoms oject. return Atoms([_get_atom_object(at) for at in unique_ats]) def _read_next_info(self, ispin, ik): """Reads the next eigenstate information. This function should only be called after reading the sizes or reading the previous state's values. Parameters ---------- ispin: integer the (python) spin index of the next eigenstate. ik: integer the (python) k index of the next eigenstate. Returns ------- array of shape (3,): The k point of the state. float: The weight of the k point. int: Number of wavefunctions that the state contains. It is needed by the function that reads the eigenstates values. """ # Store the indices of the current state self._ik = ik self._ispin = ispin # Check that we are in a position where we will read state information if self._state != 1: raise SileError(f"We are not in a position to read k point information. State is: {self._state}") # Read the state information file_ispin, file_ik, k, weight, nwf = _siesta.read_wfsx_next_info(self._iu) # Inform that we are now in front of state values self._state = 2 # Check that the read went fine self._fortran_check('_read_next_info', f"could not read next eigenstate info [{ispin + 1}, {ik + 1}]") # Check that the read indices match the indices that we were expecting. if file_ispin != ispin + 1 or file_ik != ik + 1: self._ik = file_ik - 1 self._ispin = file_ispin - 1 raise SileError(f"WFSX indices do not match the expected ones. Expected: [{ispin + 1}, {ik + 1}], found [{file_ispin}, {file_ik}]") return k, weight, nwf def _read_next_values(self, ispin, ik, nwf): """Reads the next eigenstate values. This function should only be called after reading the state's information Parameters ---------- ispin: integer the (python) spin index of the next eigenstate. ik: integer the (python) k index of the next eigenstate. nwf: integer The number of wavefunctions that the next eigenstate contains. Should have been obtained by reading the state's info with `_read_next_info`. Returns ------- array of shape (nwf,): The indices of each wavefunction that the state contains. array of shape (nwf,): The eigenvalues (in eV) of each wavefunction that the state contains. array of shape (norbitals, nwf): The coefficients for each wavefunction that the state contains. """ # Check that we are in the right position in the file if self._state != 2: raise SileError(f"We are not in a position to read k point WFSX values. State is: {self._state}") # Read the state values idx, eig, state = self._funcs.read_next(self._iu, self._sizes.no_u, nwf) # Inform that we are now in front of the next state info self._state = 1 # Check that everything went fine self._fortran_check('_read_next_values', f"could not read next eigenstate values [{ispin + 1}, {ik + 1}]") return idx, eig, state def _read_next_eigenstate(self, ispin, ik): """Reads the next eigenstate in the WFSX file. Parameters ---------- ispin: integer the (python) spin index of the next eigenstate. ik: integer the (python) k index of the next eigenstate. Returns -------- EigenstateElectron: The next eigenstate. """ # Get the information of this eigenstate k, weight, nwf = self._read_next_info(ispin, ik) # Now that we have the information, we can read the values because # we know the number of wavefunctions stored in the k point (`nwf`) idx, eig, state = self._read_next_values(ispin, ik, nwf) # Build the info dictionary for the eigenstate to know how it was calculated # We include the spin index if needed. info = dict(k=self._convert_k(k), weight=weight, gauge="r", index=idx - 1) if self._sizes.nspin == 2: info["spin"] = ispin # `eig` is already in eV # See onlysSileSiesta.read_supercell to understand why we transpose `state` return EigenstateElectron(state.T, eig, parent=self._parent, **info)
[docs] def read_sizes(self): """Reads the sizes related to this WFSX file Returns ------- int : number of spin components int : number of orbitals in the unit-cell int : number of k-points bool : True if the file only contains the Gamma-point """ self._open_wfsx("r") sizes = self._read_next_sizes() self._close_wfsx() return sizes
[docs] def read_basis(self): """Reads the basis contained in the WFSX file. The WFSX file only contains information about the atom labels, which atom each orbital belongs to and the orbital quantum numbers. It is thus not complete in every sense. Returns ------- Atoms: the basis read. """ self._open_wfsx("r") self._sizes = self._read_next_sizes(skip_basis=False) basis = self._read_next_basis() self._close_wfsx() return basis
[docs] def yield_eigenstate(self): r""" Iterates over the states in the WFSX file Yields ------ EigenstateElectron """ # Open file and get parsing information self._setup_parsing(close=False) if self._sizes.nspin == 2: itt_spin = range(2) else: itt_spin = range(1) try: # Iterate over all eigenstates in the WFSX file, yielding control to the caller at # each iteration. for ik, ispin in product(range(self._sizes.nk), itt_spin): yield self._read_next_eigenstate(ispin, ik) # We ran out of eigenstates self._close_wfsx() except GeneratorExit: # The loop in which the generator was used has been broken. self._close_wfsx()
[docs] def read_eigenstate(self, k=(0, 0, 0), spin=0, ktol=1e-4): """Reads a specific eigenstate from the file. This method iterates over the states until it finds a match. Don't call this method repeatedly. If you want to loop eigenstates, use `yield_eigenstate`. Parameters ---------- k: array-like of shape (3,), optional The k point of the state you want to find. spin: integer, optional The spin index of the state you want to find. Only meaningful for polarized calculations. ktol: float, optional The threshold value for considering two k-points the same (i.e. to match the query k point with the state's k point). See Also -------- yield_eigenstate Returns ------- EigenstateElectron or None: If found, the state that was queried. If not found, returns `None`. NOTE this may change to an exception in the future """ # Iterate over all eigenstates in the file for state in self.yield_eigenstate(): if state.info.get("spin", 0) == spin and np.allclose(state.info['k'], k, atol=ktol): # This is the state that the user requested return state return None
[docs] def read_info(self): """Reads the information for all the k points contained in the file Returns ------- k: array of shape (nk, 3) k values of the k points contained in the file. weight: array of shape (nk,) weight of each k point nwf: array of shape (nspin, nk) number of wavefunctions that each kpoint(-spin) contains. """ # Open file and get parsing information self._setup_parsing(close=False, skip_basis=True) # Check if we are in the correct position in the file (we should be just after the header) if self._state != 1: raise ValueError(f"We are not in a position to read eigenstate info in the file. State: {self._state}") # Read all the information. Parse here the k values obtained. # Store the information that should be returned under `returns`. if self._sizes.nspin == 2: nspin = 2 else: nspin = 1 k, kw, nwf = _siesta.read_wfsx_next_all_info(self._iu, 1, self._sizes.nk) # Close the file unit self._close_wfsx() # Check for errors in the read. self._fortran_check("read_info", "could not read file information.") return self._convert_k(k), kw, nwf
[docs] def read_brillouinzone(self): """ Read the brillouin zone object """ k, weight, _ = self.read_info() return BrillouinZone(self._parent, k=k, weight=weight)
@set_module("sisl.io.siesta") class _gridSileSiesta(SileBinSiesta): r""" Binary real-space grid file The Siesta binary grid sile will automatically convert the units from Siesta units (Bohr, Ry) to sisl units (Ang, eV) provided the correct extension is present. """ def read_supercell(self, *args, **kwargs): r""" Return the cell contained in the file """ cell = _siesta.read_grid_cell(self.file).T * _Bohr2Ang self._fortran_check('read_supercell', 'could not read cell.') return SuperCell(cell) def read_grid_size(self): r""" Query grid size information such as the grid size and number of spin components Returns ------- int : number of spin-components mesh : 3 values for the number of mesh-elements """ # Read the sizes nspin, mesh = _siesta.read_grid_sizes(self.file) self._fortran_check('read_grid_size', 'could not read grid sizes.') return nspin, mesh def read_grid(self, index=0, dtype=np.float64, *args, **kwargs): """ Read grid contained in the Grid file Parameters ---------- index : int or array_like, optional the spin-index for retrieving one of the components. If a vector is passed it refers to the fraction per indexed component. I.e. ``[0.5, 0.5]`` will return sum of half the first two components. Default to the first component. dtype : numpy.float64, optional default data-type precision """ index = kwargs.get('spin', index) # Read the sizes and cell nspin, mesh = self.read_grid_size() sc = self.read_supercell() grid = _siesta.read_grid(self.file, nspin, mesh[0], mesh[1], mesh[2]) self._fortran_check('read_grid', 'could not read grid.') if isinstance(index, Integral): grid = grid[:, :, :, index] else: if len(index) > grid.shape[0]: raise ValueError(self.__class__.__name__ + '.read_grid requires spin to be an integer or ' 'an array of length equal to the number of spin components.') # It is F-contiguous, hence the last index g = grid[:, :, :, 0] * index[0] for i, scale in enumerate(index[1:]): g += grid[:, :, :, 1+i] * scale grid = g # Simply create the grid (with no information) # We will overwrite the actual grid g = Grid([1, 1, 1], sc=sc) # NOTE: there is no need to swap-axes since the returned array is in F ordering # and thus the first axis is the fast (x, y, z) is retained g.grid = grid * self.grid_unit return g @set_module("sisl.io.siesta") class _gfSileSiesta(SileBinSiesta): """ Surface Green function file containing, Hamiltonian, overlap matrix and self-energies Do not mix read and write statements when using this code. Complete one or the other before doing the other thing. Fortran does not allow the same file opened twice, if this is needed you are recommended to make a symlink to the file and thus open two different files. This small snippet reads/writes the GF file >>> with sisl.io._gfSileSiesta('hello.GF') as f: ... nspin, no, k, E = f.read_header() ... for ispin, new_k, k, E in f: ... if new_k: ... H, S = f.read_hamiltonian() ... SeHSE = f.read_self_energy() To write a file do: >>> with sisl.io._gfSileSiesta('hello.GF') as f: ... f.write_header(sisl.MonkhorstPack(...), E) ... for ispin, new_k, k, E in f: ... if new_k: ... f.write_hamiltonian(H, S) ... f.write_self_energy(SeHSE) """ def _setup(self, *args, **kwargs): """ Simple setup that needs to be overwritten """ super()._setup(*args, **kwargs) # The unit convention used for energy-points # This is necessary until Siesta uses CODATA values if kwargs.get("version", "old").lower() in ("old", "4.1"): self._E_Ry2eV = 13.60580 else: self._E_Ry2eV = _Ry2eV def _open_gf(self, mode, rewind=False): self._fortran_open(mode, rewind=rewind) # They will at any given time # correspond to the current Python indices that is to be read # The process for identification is done on this basis: # iE is the current (Python) index for the energy-point to be read # ik is the current (Python) index for the k-point to be read # ispin is the current (Python) index for the spin-index to be read (only has meaning for a spin-polarized # GF files) # state is: # -1 : the file-descriptor has just been opened (i.e. in front of header) # 0 : it means that the file-descriptor IS in front of H and S # 1 : it means that the file-descriptor is NOT in front of H and S but somewhere in front of a self-energy # is_read is: # 0 : means that the current indices HAVE NOT been read # 1 : means that the current indices HAVE been read # # All routines in the gf_read/write sources requires input in Python indices self._state = -1 self._is_read = 0 self._ispin = 0 self._ik = 0 self._iE = 0 def _close_gf(self): if not self._fortran_is_open(): return self._fortran_close() # Clean variables del self._state del self._iE del self._ik del self._ispin try: del self._no_u except: pass try: del self._nspin except: pass def _step_counter(self, method, **kwargs): """ Method for stepping values *must* be called before doing the actual read to check correct values """ opt = {'method': method} if kwargs.get('header', False): # The header only exists once, so check whether it is the correct place to read/write if self._state != -1 or self._is_read == 1: raise SileError(self.__class__.__name__ + '.{method} failed because the header has already ' 'been read.'.format(**opt)) self._state = -1 self._ispin = 0 self._ik = 0 self._iE = 0 #print('HEADER: ', self._state, self._ispin, self._ik, self._iE) elif kwargs.get('HS', False): # Correct for the previous state and jump values if self._state == -1: # We have just read the header if self._is_read != 1: raise SileError(self.__class__.__name__ + '.{method} failed because the file descriptor ' 'has not read the header.'.format(**opt)) # Reset values as though the header has just been read self._state = 0 self._ispin = 0 self._ik = 0 self._iE = 0 elif self._state == 0: if self._is_read == 1: raise SileError(self.__class__.__name__ + '.{method} failed because the file descriptor ' 'has already read the current HS for the given k-point.'.format(**opt)) elif self._state == 1: # We have just read from the last energy-point if self._iE + 1 != self._nE or self._is_read != 1: raise SileError(self.__class__.__name__ + '.{method} failed because the file descriptor ' 'has not read all energy-points for a given k-point.'.format(**opt)) self._state = 0 self._ik += 1 if self._ik >= self._nk: # We need to step spin self._ispin += 1 self._ik = 0 self._iE = 0 #print('HS: ', self._state, self._ispin, self._ik, self._iE) if self._ispin >= self._nspin: opt['spin'] = self._ispin + 1 opt['nspin'] = self._nspin raise SileError(self.__class__.__name__ + '.{method} failed because of missing information, ' 'a non-existing entry has been requested! spin={spin} max_spin={nspin}.'.format(**opt)) else: # We are reading an energy-point if self._state == -1: raise SileError(self.__class__.__name__ + '.{method} failed because the file descriptor ' 'has an unknown state.'.format(**opt)) elif self._state == 0: if self._is_read == 1: # Fine, we have just read the HS, ispin and ik are correct self._state = 1 self._iE = 0 else: raise SileError(self.__class__.__name__ + '.{method} failed because the file descriptor ' 'has an unknown state.'.format(**opt)) elif self._state == 1: if self._is_read == 0 and self._iE < self._nE: # we haven't read the current energy-point.and self._iE + 1 < self._nE: pass elif self._is_read == 1 and self._iE + 1 < self._nE: self._iE += 1 else: raise SileError(self.__class__.__name__ + '.{method} failed because the file descriptor ' 'has an unknown state.'.format(**opt)) if self._iE >= self._nE: # You are trying to read beyond the entry opt['iE'] = self._iE + 1 opt['NE'] = self._nE raise SileError(self.__class__.__name__ + '.{method} failed because of missing information, ' 'a non-existing energy-point has been requested! E_index={iE} max_E_index={NE}.'.format(**opt)) #print('SE: ', self._state, self._ispin, self._ik, self._iE) # Always signal (when stepping) that we have not yet read the thing if kwargs.get('read', False): self._is_read = 1 else: self._is_read = 0 def Eindex(self, E): """ Return the closest energy index corresponding to the energy ``E`` Parameters ---------- E : float or int if ``int``, return it-self, else return the energy index which is closests to the energy. """ if isinstance(E, Integral): return E idxE = np.abs(self._E - E).argmin() ret_E = self._E[idxE] if abs(ret_E - E) > 5e-3: warn(self.__class__.__name__ + " requesting energy " + f"{E:.5f} eV, found {ret_E:.5f} eV as the closest energy!") elif abs(ret_E - E) > 1e-3: info(self.__class__.__name__ + " requesting energy " + f"{E:.5f} eV, found {ret_E:.5f} eV as the closest energy!") return idxE def kindex(self, k): """ Return the index of the k-point that is closests to the queried k-point (in reduced coordinates) Parameters ---------- k : array_like of float or int the queried k-point in reduced coordinates :math:`]-0.5;0.5]`. If ``int`` return it-self. """ if isinstance(k, Integral): return k ik = np.sum(np.abs(self._k - _a.asarrayd(k)[None, :]), axis=1).argmin() ret_k = self._k[ik, :] if not np.allclose(ret_k, k, atol=0.0001): warn(SileWarning(self.__class__.__name__ + " requesting k-point " + "[{:.3f}, {:.3f}, {:.3f}]".format(*k) + " found " + "[{:.3f}, {:.3f}, {:.3f}]".format(*ret_k))) return ik def read_header(self): """ Read the header of the file and open it for reading subsequently NOTES: this method may change in the future Returns ------- nspin : number of spin-components stored (1 or 2) no_u : size of the matrices returned k : k points in the GF file E : energy points in the GF file """ # Ensure it is open (in read-mode) if self._fortran_is_open(): _siesta.io_m.rewind_file(self._iu) else: self._open_gf('r') nspin, no_u, nkpt, NE = _siesta.read_gf_sizes(self._iu) self._fortran_check('read_header', 'could not read sizes.') self._nspin = nspin self._nk = nkpt self._nE = NE # We need to rewind (because of k and energy -points) _siesta.io_m.rewind_file(self._iu) self._step_counter('read_header', header=True, read=True) k, E = _siesta.read_gf_header(self._iu, nkpt, NE) self._fortran_check('read_header', 'could not read header information.') if self._nspin > 2: # non-colinear self._no_u = no_u * 2 else: self._no_u = no_u self._E = E * self._E_Ry2eV self._k = k.T return nspin, no_u, self._k, self._E def disk_usage(self): """ Calculate the estimated size of the resulting file Returns ------- estimated disk-space used in GB """ is_open = self._fortran_is_open() if not is_open: self.read_header() # HS are only stored per k-point HS = 2 * self._nspin * self._nk SE = HS / 2 * self._nE # Now calculate the full size # no_u ** 2 = matrix size # 16 = bytes in double complex # 1024 ** 3 = B -> GB mem = (HS + SE) * self._no_u ** 2 * 16 / 1024 ** 3 if not is_open: self._close_gf() return mem def read_hamiltonian(self): """ Return current Hamiltonian and overlap matrix from the GF file Returns ------- complex128 : Hamiltonian matrix complex128 : Overlap matrix """ self._step_counter('read_hamiltonian', HS=True, read=True) H, S = _siesta.read_gf_hs(self._iu, self._no_u) self._fortran_check('read_hamiltonian', 'could not read Hamiltonian and overlap matrices.') # we don't convert to C order! return H * _Ry2eV, S def read_self_energy(self): r""" Read the currently reached bulk self-energy The returned self-energy is: .. math:: \boldsymbol \Sigma_{\mathrm{bulk}}(E) = \mathbf S E - \mathbf H - \boldsymbol \Sigma(E) Returns ------- complex128 : Self-energy matrix """ self._step_counter('read_self_energy', read=True) SE = _siesta.read_gf_se(self._iu, self._no_u, self._iE) self._fortran_check('read_self_energy', 'could not read self-energy.') # we don't convert to C order! return SE * _Ry2eV def HkSk(self, k=(0, 0, 0), spin=0): """ Retrieve H and S for the given k-point Parameters ---------- k : int or array_like of float, optional k-point to read the corresponding Hamiltonian and overlap matrices for. If a specific k-point is passed `kindex` will be used to find the corresponding index. spin : int, optional spin-index for the Hamiltonian and overlap matrices """ if not self._fortran_is_open(): self.read_header() # find k-index that is requested ik = self.kindex(k) _siesta.read_gf_find(self._iu, self._nspin, self._nk, self._nE, self._state, self._ispin, self._ik, self._iE, self._is_read, 0, spin, ik, 0) self._fortran_check('HkSk', 'could not find Hamiltonian and overlap matrix.') self._state = 0 self._ispin = spin self._ik = ik self._iE = 0 self._is_read = 0 # signal this is to be read return self.read_hamiltonian() def self_energy(self, E, k=0, spin=0): """ Retrieve self-energy for a given energy-point and k-point Parameters ---------- E : int or float energy to retrieve self-energy at k : int or array_like of float, optional k-point to retrieve k-point at spin : int, optional spin-index to retrieve self-energy at """ if not self._fortran_is_open(): self.read_header() ik = self.kindex(k) iE = self.Eindex(E) _siesta.read_gf_find(self._iu, self._nspin, self._nk, self._nE, self._state, self._ispin, self._ik, self._iE, self._is_read, 1, spin, ik, iE) self._fortran_check('self_energy', 'could not find requested self-energy.') self._state = 1 self._ispin = spin self._ik = ik self._iE = iE self._is_read = 0 # signal this is to be read return self.read_self_energy() def write_header(self, bz, E, mu=0., obj=None): """ Write to the binary file the header of the file Parameters ---------- bz : BrillouinZone contains the k-points, the weights and possibly the parent Hamiltonian (if `obj` is None)s E : array_like of cmplx or float the energy points. If `obj` is an instance of `SelfEnergy` where an associated ``eta`` is defined then `E` may be float, otherwise it *has* to be a complex array. mu : float, optional chemical potential in the file obj : ..., optional an object that contains the Hamiltonian definitions, defaults to ``bz.parent`` """ if obj is None: obj = bz.parent nspin = len(obj.spin) cell = obj.geometry.sc.cell na_u = obj.geometry.na no_u = obj.geometry.no xa = obj.geometry.xyz # The lasto in siesta requires lasto(0) == 0 # and secondly, the Python index to fortran # index makes firsto behave like fortran lasto lasto = obj.geometry.firsto bloch = _a.onesi(3) mu = mu NE = len(E) if E.dtype not in [np.complex64, np.complex128]: E = E + 1j * obj.eta Nk = len(bz) k = bz.k w = bz.weight sizes = { 'na_used': na_u, 'nkpt': Nk, 'ne': NE, } self._nspin = nspin self._E = E self._k = np.copy(k) self._nE = len(E) self._nk = len(k) if self._nspin > 2: self._no_u = no_u * 2 else: self._no_u = no_u # Ensure it is open (in write mode) self._close_gf() self._open_gf('w') # Now write to it... self._step_counter('write_header', header=True, read=True) # see onlysSileSiesta.read_supercell for .T _siesta.write_gf_header(self._iu, nspin, _toF(cell.T, np.float64, 1. / _Bohr2Ang), na_u, no_u, no_u, _toF(xa.T, np.float64, 1. / _Bohr2Ang), lasto, bloch, 0, mu * _eV2Ry, _toF(k.T, np.float64), w, self._E / self._E_Ry2eV, **sizes) self._fortran_check('write_header', 'could not write header information.') def write_hamiltonian(self, H, S=None): """ Write the current energy, k-point and H and S to the file Parameters ---------- H : matrix a square matrix corresponding to the Hamiltonian S : matrix, optional a square matrix corresponding to the overlap, for efficiency reasons it may be advantageous to specify this argument for orthogonal cells. """ no = len(H) if S is None: S = np.eye(no, dtype=np.complex128, order='F') self._step_counter('write_hamiltonian', HS=True, read=True) _siesta.write_gf_hs(self._iu, self._ik, self._E[self._iE] / self._E_Ry2eV, _toF(H, np.complex128, _eV2Ry), _toF(S, np.complex128), no_u=no) self._fortran_check('write_hamiltonian', 'could not write Hamiltonian and overlap matrices.') def write_self_energy(self, SE): r""" Write the current self energy, k-point and H and S to the file The self-energy must correspond to the *bulk* self-energy .. math:: \boldsymbol \Sigma_{\mathrm{bulk}}(E) = \mathbf S E - \mathbf H - \boldsymbol \Sigma(E) Parameters ---------- SE : matrix a square matrix corresponding to the self-energy (Green function) """ no = len(SE) self._step_counter('write_self_energy', read=True) _siesta.write_gf_se(self._iu, self._ik, self._iE, self._E[self._iE] / self._E_Ry2eV, _toF(SE, np.complex128, _eV2Ry), no_u=no) self._fortran_check('write_self_energy', 'could not write self-energy.') def __len__(self): return self._nE * self._nk * self._nspin def __iter__(self): """ Iterate through the energies and k-points that this GF file is associated with Yields ------ bool, list of float, float """ # get everything e = self._E if self._nspin in [1, 2]: GFStep = namedtuple("GFStep", ["spin", "do_HS", "k", "E"]) for ispin in range(self._nspin): for k in self._k: yield GFStep(ispin, True, k, e[0]) for E in e[1:]: yield GFStep(ispin, False, k, E) else: GFStep = namedtuple("GFStep", ["do_HS", "k", "E"]) for k in self._k: yield GFStep(True, k, e[0]) for E in e[1:]: yield GFStep(False, k, E) # We will automatically close once we hit the end self._close_gf() def _type(name, obj, dic=None): if dic is None: dic = {} # Always pass the docstring if not '__doc__' in dic: try: dic['__doc__'] = obj.__doc__.replace(obj.__name__, name) except: pass return type(name, (obj, ), dic) # Faster than class ... \ pass tsgfSileSiesta = _type("tsgfSileSiesta", _gfSileSiesta) gridSileSiesta = _type("gridSileSiesta", _gridSileSiesta, {'grid_unit': 1.}) if found_module: add_sile('TSHS', tshsSileSiesta) add_sile('onlyS', onlysSileSiesta) add_sile('TSDE', tsdeSileSiesta) add_sile('DM', dmSileSiesta) add_sile('HSX', hsxSileSiesta) add_sile('TSGF', tsgfSileSiesta) add_sile('WFSX', wfsxSileSiesta) # These have unit-conversions add_sile('RHO', _type("rhoSileSiesta", _gridSileSiesta, {'grid_unit': 1./_Bohr2Ang ** 3})) add_sile('LDOS', _type("ldosSileSiesta", _gridSileSiesta, {'grid_unit': 1./_Bohr2Ang ** 3})) add_sile('RHOINIT', _type("rhoinitSileSiesta", _gridSileSiesta, {'grid_unit': 1./_Bohr2Ang ** 3})) add_sile('RHOXC', _type("rhoxcSileSiesta", _gridSileSiesta, {'grid_unit': 1./_Bohr2Ang ** 3})) add_sile('DRHO', _type("drhoSileSiesta", _gridSileSiesta, {'grid_unit': 1./_Bohr2Ang ** 3})) add_sile('BADER', _type("baderSileSiesta", _gridSileSiesta, {'grid_unit': 1./_Bohr2Ang ** 3})) add_sile('IOCH', _type("iorhoSileSiesta", _gridSileSiesta, {'grid_unit': 1./_Bohr2Ang ** 3})) add_sile('TOCH', _type("totalrhoSileSiesta", _gridSileSiesta, {'grid_unit': 1./_Bohr2Ang ** 3})) # The following two files *require* that # STM.DensityUnits Ele/bohr**3 # which I can't check! # They are however the default add_sile('STS', _type("stsSileSiesta", _gridSileSiesta, {'grid_unit': 1./_Bohr2Ang ** 3})) add_sile('STM.LDOS', _type("stmldosSileSiesta", _gridSileSiesta, {'grid_unit': 1./_Bohr2Ang ** 3})) add_sile('VH', _type("hartreeSileSiesta", _gridSileSiesta, {'grid_unit': _Ry2eV})) add_sile('VNA', _type("neutralatomhartreeSileSiesta", _gridSileSiesta, {'grid_unit': _Ry2eV})) add_sile('VT', _type("totalhartreeSileSiesta", _gridSileSiesta, {'grid_unit': _Ry2eV}))