`kups.application.mcmc.data` ¶

Reusable data types and configuration for rigid-body MCMC simulations.

`AdsorbateConfig` ¶

Bases: BaseModel

Configuration for a single adsorbate species.

Thermodynamic parameters feed Peng-Robinson EOS for fugacity calculation. Molecular geometry is defined by positions and symbols; charges, masses, and atomic numbers are auto-derived from ASE if omitted.

Source code in src/kups/application/mcmc/data.py

class AdsorbateConfig(BaseModel):
    """Configuration for a single adsorbate species.

    Thermodynamic parameters feed Peng-Robinson EOS for fugacity calculation.
    Molecular geometry is defined by ``positions`` and ``symbols``; charges,
    masses, and atomic numbers are auto-derived from ASE if omitted.
    """

    critical_temperature: float
    """Critical temperature (K) for Peng-Robinson EOS."""
    critical_pressure: float
    """Critical pressure (Pa) for Peng-Robinson EOS."""
    acentric_factor: float
    """Acentric factor (dimensionless)."""
    positions: tuple[tuple[float, float, float], ...]
    """Atom positions within the molecule, relative to its centre of mass (Ang)."""
    symbols: tuple[str, ...]
    """Element symbols for each atom in the molecule."""
    charges: tuple[float, ...] = ()
    """Partial charges on each atom (e). Defaults to zeros."""
    masses: tuple[float, ...] = ()
    """Atomic masses (amu). Derived from symbols via ASE if omitted."""
    atomic_numbers: tuple[int, ...] = ()
    """Atomic numbers. Derived from symbols via ASE if omitted."""

    @model_validator(mode="before")
    @classmethod
    def _fill_defaults_from_ase(cls, data: object) -> object:
        """Derive charges, masses, and atomic numbers from symbols when absent.

        Runs before field validation, so ``data`` is the raw input. Only
        ``dict`` input is processed; anything else is returned unchanged so
        that pydantic's own validation handles it. The derived defaults are
        written to a shallow copy, so the caller's dict is never modified.

        A field counts as absent when it is missing or falsy (e.g. ``()``).
        The element is looked up from the part of each symbol before the first
        ``"_"``; symbols unknown to ASE get atomic number 0 and mass 0.0.

        Args:
            data: Raw input passed to the model constructor/validator.

        Returns:
            A new dict with the defaults filled in, or ``data`` itself when it
            is not a dict.
        """
        if not isinstance(data, dict):
            return data
        # Copy first: a "before" validator must not leak derived values into
        # the caller's dict.
        filled = dict(data)
        symbols = filled.get("symbols", ())
        if not filled.get("charges"):
            filled["charges"] = tuple(0.0 for _ in symbols)
        need_masses = not filled.get("masses")
        need_numbers = not filled.get("atomic_numbers")
        if need_masses or need_numbers:
            # "C_co2"-style labels resolve to the element before the underscore.
            zs = [ase.data.atomic_numbers.get(s.split("_")[0], 0) for s in symbols]
            if need_masses:
                filled["masses"] = tuple(
                    float(ase.data.atomic_masses[z]) if z > 0 else 0.0 for z in zs
                )
            if need_numbers:
                filled["atomic_numbers"] = tuple(zs)
        return filled

    @property
    def as_particles(self) -> Table[MotifParticleId, MotifParticles]:
        """Convert this adsorbate config into indexed particles with motif data.

        Every atom is assigned motif index 0, and the motif index is built with
        ``max_count=len(self.positions)``, i.e. the number of atoms in this
        molecule.

        Returns:
            A table built with ``Table.arange`` under the ``MotifParticleId``
            label, holding one ``MotifParticles`` entry per atom.
        """
        n = len(self.symbols)
        return Table.arange(
            MotifParticles(
                positions=jnp.asarray(self.positions),
                masses=jnp.asarray(self.masses),
                atomic_numbers=jnp.asarray(self.atomic_numbers),
                charges=jnp.asarray(self.charges),
                labels=Index.new(list(map(Label, self.symbols))),
                motif=Index.integer(
                    jnp.zeros(n, dtype=int),
                    label=MotifId,
                    max_count=len(self.positions),
                ),
            ),
            label=MotifParticleId,
        )

`acentric_factor` `instance-attribute` ¶

Acentric factor (dimensionless).

`as_particles` `property` ¶

Convert this adsorbate config into indexed particles with motif data.

`atomic_numbers = ()` `class-attribute` `instance-attribute` ¶

Atomic numbers. Derived from symbols via ASE if omitted.

`charges = ()` `class-attribute` `instance-attribute` ¶

Partial charges on each atom (e). Defaults to zeros.

`critical_pressure` `instance-attribute` ¶

Critical pressure (Pa) for Peng-Robinson EOS.

`critical_temperature` `instance-attribute` ¶

Critical temperature (K) for Peng-Robinson EOS.

`masses = ()` `class-attribute` `instance-attribute` ¶

Atomic masses (amu). Derived from symbols via ASE if omitted.

`positions` `instance-attribute` ¶

Atom positions within the molecule, relative to its centre of mass (Ang).

`symbols` `instance-attribute` ¶

Element symbols for each atom in the molecule.

`BlockingSphereConfig` ¶

Bases: BaseModel

Configuration for a blocking sphere to prevent adsorbate placement in certain regions.

Source code in src/kups/application/mcmc/data.py

class BlockingSphereConfig(BaseModel):
    """Configuration for a blocking sphere to prevent adsorbate placement in certain regions.

    A sphere is described by its ``center`` and ``radius``, both in Angstrom.
    """

    # NOTE(review): how the exclusion is enforced (which moves consult the
    # spheres) is not visible in this class; see the consumers of
    # ``HostConfig.blocking_spheres``.
    center: tuple[float, float, float]
    """Center of the blocking sphere in Cartesian coordinates (Ang)."""
    radius: float
    """Radius of the blocking sphere (Ang)."""

`center` `instance-attribute` ¶

Center of the blocking sphere in Cartesian coordinates (Ang).

`radius` `instance-attribute` ¶

Radius of the blocking sphere (Ang).

`EwaldCfg` ¶

Bases: BaseModel

Ewald summation settings for electrostatic interactions.

Source code in src/kups/application/mcmc/data.py

class EwaldCfg(BaseModel):
    """Ewald summation settings for electrostatic interactions.

    All fields have defaults, so ``EwaldCfg()`` is a valid configuration.
    """

    # Presumably toggles whether the Ewald electrostatic term is evaluated at
    # all -- TODO confirm against the code that consumes this config.
    enabled: bool = True
    cutoff: float = 12.0
    """Real-space cutoff (Ang)."""
    precision: float = 1e-6
    """Target error tolerance."""

`cutoff = 12.0` `class-attribute` `instance-attribute` ¶

Real-space cutoff (Ang).

`precision = 1e-06` `class-attribute` `instance-attribute` ¶

Target error tolerance.

`HostConfig` ¶

Bases: BaseModel

Configuration for a single host framework (e.g. zeolite, MOF).

Each host gets its own system with unit cell, thermodynamic conditions, and optional initial adsorbate placement.

Source code in src/kups/application/mcmc/data.py

class HostConfig(BaseModel):
    """Configuration for a single host framework (e.g. zeolite, MOF).

    Each host gets its own system with unit cell, thermodynamic conditions,
    and optional initial adsorbate placement.

    The defaults of the per-species fields (``init_adsorbates``,
    ``adsorbate_composition``, ``adsorbate_interaction``, ``blocking_spheres``)
    all have length one, i.e. they describe a single adsorbate species.
    """

    cif_file: str
    """Path to the host structure CIF file."""
    pressure: float
    """System pressure (Pa)."""
    temperature: float
    """System temperature (K)."""
    init_adsorbates: tuple[int, ...] = (0,)
    """Number of initial adsorbates per species to randomly insert."""
    adsorbate_composition: tuple[float, ...] = (1.0,)
    """Mole fractions for each adsorbate component (must sum to 1)."""
    adsorbate_interaction: tuple[tuple[float, ...], ...] = ((0.0,),)
    """Binary interaction parameters k_ij (n_ads x n_ads)."""
    # The annotation also accepts a bare int; presumably that means the same
    # replication factor along all three axes -- TODO confirm against
    # ``make_supercell``.
    cell_replication: int | tuple[int, int, int] | None = None
    """(nx, ny, nz) replication of the unit cell. Auto-computed if None."""
    blocking_spheres: tuple[tuple[BlockingSphereConfig, ...], ...] = ((),)
    """Blocking spheres preventing adsorbate placement in selected regions. Outer
    tuple is indexed per adsorbate species; each inner tuple lists spheres for that
    species and may have variable length."""

`adsorbate_composition = (1.0,)` `class-attribute` `instance-attribute` ¶

Mole fractions for each adsorbate component (must sum to 1).

`adsorbate_interaction = ((0.0,),)` `class-attribute` `instance-attribute` ¶

Binary interaction parameters k_ij (n_ads x n_ads).

`blocking_spheres = ((),)` `class-attribute` `instance-attribute` ¶

Blocking spheres preventing adsorbate placement in selected regions. Outer tuple is indexed per adsorbate species; each inner tuple lists spheres for that species and may have variable length.

`cell_replication = None` `class-attribute` `instance-attribute` ¶

(nx, ny, nz) replication of the unit cell. Auto-computed if None.

`cif_file` `instance-attribute` ¶

Path to the host structure CIF file.

`init_adsorbates = (0,)` `class-attribute` `instance-attribute` ¶

Number of initial adsorbates per species to randomly insert.

`pressure` `instance-attribute` ¶

System pressure (Pa).

`temperature` `instance-attribute` ¶

System temperature (K).

`LJConfig` ¶

Bases: BaseModel

Lennard-Jones force-field parameters.

Source code in src/kups/application/mcmc/data.py

class LJConfig(BaseModel):
    """Lennard-Jones force-field parameters.

    ``parameters`` is the only required field; ``cutoff`` and
    ``tail_correction`` have defaults.
    """

    # NOTE(review): how parameters for unlike pairs are combined (mixing rule)
    # is not specified here; check the code that consumes this config.
    parameters: dict[str, tuple[float, float]]
    """Mapping symbol -> (epsilon/kB [K], sigma [Ang]) for each element type."""
    cutoff: float = 12.0
    """Real-space cutoff (Ang)."""
    tail_correction: bool = True
    """Apply long-range tail correction."""

`cutoff = 12.0` `class-attribute` `instance-attribute` ¶

Real-space cutoff (Ang).

`parameters` `instance-attribute` ¶

Mapping symbol -> (epsilon/kB [K], sigma [Ang]) for each element type.

`tail_correction = True` `class-attribute` `instance-attribute` ¶

Apply long-range tail correction.

`MCMCGroup` ¶

Molecular group state for rigid-body MCMC.

Attributes:

Name	Type	Description
`system`	`Index[SystemId]`	Index mapping each group to its parent system.
`motif`	`Index[MotifId]`	Index mapping each group to its adsorbate species.

Source code in src/kups/application/mcmc/data.py

@dataclass
class MCMCGroup:
    """State of the molecular groups moved as rigid bodies during MCMC.

    Attributes:
        system: Index mapping each group to its parent system.
        motif: Index mapping each group to its adsorbate species.
    """

    system: Index[SystemId]
    motif: Index[MotifId]

    @property
    def labels(self) -> Index[Label]:
        """Per-group labels: the motif keys converted to ``Label(str(key))``.

        The returned index reuses the motif index's ``indices`` unchanged.
        """
        motif_index = self.motif
        label_keys = tuple(Label(str(key)) for key in motif_index.keys)
        return Index(label_keys, motif_index.indices)

`labels` `property` ¶

Group labels derived from motif index.

`MCMCParticles` ¶

Bases: Particles

Particle state for rigid-body MCMC with group membership.

Attributes:

Name	Type	Description
`group`	`Index[GroupId]`	Index mapping each particle to its molecular group.

Source code in src/kups/application/mcmc/data.py

@dataclass
class MCMCParticles(Particles):
    """Particle state for rigid-body MCMC with group membership.

    Attributes:
        group: Index mapping each particle to its molecular group.
        motif: Index labelled by ``MotifParticleId``; presumably maps each
            particle to its template atom in the motif table (TODO confirm).
        position_gradients: Array shaped like ``positions``; filled with zeros
            in ``__post_init__`` when not supplied.
    """

    group: Index[GroupId]
    motif: Index[MotifParticleId]
    position_gradients: Array = field(default=None)  # type: ignore[assignment]

    def __post_init__(self):
        """Default ``position_gradients`` to zeros shaped like ``positions``."""
        if self.position_gradients is not None:
            return
        # object.__setattr__ bypasses any attribute-assignment restrictions
        # the dataclass may impose.
        object.__setattr__(self, "position_gradients", jnp.zeros_like(self.positions))

    @property
    def inclusion(self) -> Index[InclusionId]:
        """Inclusion index: the system index with keys recast as ``InclusionId``."""
        source = self.system
        inclusion_keys = tuple(map(InclusionId, source.keys))
        return Index(inclusion_keys, source.indices, source.max_count)

    @property
    def exclusion(self) -> Index[ExclusionId]:
        """Exclusion index: the group index with keys recast as ``ExclusionId``."""
        source = self.group
        exclusion_keys = tuple(map(ExclusionId, source.keys))
        return Index(exclusion_keys, source.indices, source.max_count)

    def guest_only(self) -> MCMCParticles:
        """Return the particle data restricted to valid group membership.

        Buffered sanitizes the data to only include particles with valid
        group membership.
        """
        buffered = Buffered.arange(self, view=lambda particles: particles.group)
        return buffered.data

`exclusion` `property` ¶

Exclusion index derived from the group index.

`inclusion` `property` ¶

Inclusion index derived from the system index.

`MCMCSystems` ¶

Per-system thermodynamic state for MCMC simulations.

Attributes:

Name	Type	Description
`cell`	`Cell`	Cell geometry, batched shape `(n_systems,)`.
`temperature`	`Array`	Temperature (K), shape `(n_systems,)`.
`potential_energy`	`Array`	Total potential energy per system (eV), shape `(n_systems,)`.
`log_fugacity`	`Array`	Log fugacity per species (dimensionless), shape `(n_systems, n_species)`.

Source code in src/kups/application/mcmc/data.py

@dataclass
class MCMCSystems:
    """Thermodynamic state stored per system for MCMC simulations.

    Attributes:
        cell: Cell geometry, batched shape ``(n_systems,)``.
        temperature: Temperature (K), shape ``(n_systems,)``.
        potential_energy: Total potential energy per system (eV), shape ``(n_systems,)``.
        log_fugacity: Log fugacity per species (dimensionless), shape ``(n_systems, n_species)``.
        cell_gradients: Same structure as ``cell``; set to
            ``tree_zeros_like(cell)`` in ``__post_init__`` when not supplied.
    """

    cell: Cell
    temperature: Array
    potential_energy: Array
    log_fugacity: Array
    cell_gradients: Cell = field(default=None)  # type: ignore[assignment]

    def __post_init__(self):
        """Default ``cell_gradients`` to a zero tree matching ``cell``."""
        if self.cell_gradients is not None:
            return
        object.__setattr__(self, "cell_gradients", tree_zeros_like(self.cell))

    @property
    def log_activity(self) -> Array:
        """Log activity: log(fugacity / kT), shape ``(n_systems, n_species)``."""
        thermal_energy = self.temperature * BOLTZMANN_CONSTANT
        # Add a trailing axis so the per-system log(kT) broadcasts over species.
        log_thermal_energy = jnp.log(thermal_energy)[:, None]
        return self.log_fugacity - log_thermal_energy

`log_activity` `property` ¶

Log activity: log(fugacity / kT), shape (n_systems, n_species).

`MotifParticles` ¶

Template particle data for an adsorbate motif (molecule template).

Stores the reference geometry, atomic properties, and species assignment for each atom in an adsorbate molecule. Used as a lookup table during exchange moves to populate new particle data.

Attributes:

Name	Type	Description
`positions`	`Array`	Reference atom positions relative to COM (Ang), shape `(n_atoms, 3)`.
`masses`	`Array`	Atomic masses (amu), shape `(n_atoms,)`.
`atomic_numbers`	`Array`	Atomic numbers, shape `(n_atoms,)`.
`charges`	`Array`	Partial charges (e), shape `(n_atoms,)`.
`labels`	`Index[Label]`	Per-atom string labels.
`motif`	`Index[MotifId]`	Index mapping atoms to their species (MotifId).

Source code in src/kups/application/mcmc/data.py

@dataclass
class MotifParticles:
    """Template particle data for an adsorbate motif (molecule template).

    Stores the reference geometry, atomic properties, and species assignment
    for each atom in an adsorbate molecule. Used as a lookup table during
    exchange moves to populate new particle data.

    Instances for a single species are produced by
    ``AdsorbateConfig.as_particles`` in this module.

    Attributes:
        positions: Reference atom positions relative to COM (Ang), shape ``(n_atoms, 3)``.
        masses: Atomic masses (amu), shape ``(n_atoms,)``.
        atomic_numbers: Atomic numbers, shape ``(n_atoms,)``.
        charges: Partial charges (e), shape ``(n_atoms,)``.
        labels: Per-atom string labels.
        motif: Index mapping atoms to their species (MotifId).
    """

    positions: Array
    masses: Array
    atomic_numbers: Array
    charges: Array
    labels: Index[Label]
    motif: Index[MotifId]

`RunConfig` ¶

Bases: BaseModel

Run configuration for MCMC simulation.

Source code in src/kups/application/mcmc/data.py

class RunConfig(BaseModel):
    """Run configuration for MCMC simulation.

    The four ``*_prob`` fields hold one probability per move type
    (translation, rotation, reinsertion, exchange). Their defaults
    (1/6 + 1/6 + 1/6 + 1/2) sum to 1. This class does not check that
    user-supplied values sum to 1.
    """

    out_file: str | Path
    """Path to the output HDF5 file."""
    num_cycles: int
    """Number of production cycles."""
    num_warmup_cycles: int
    """Number of warmup cycles (not written to output)."""
    min_cycle_length: int
    """Minimum cycle length (presumably in MC steps per cycle; confirm against the propagator)."""
    translation_prob: float = 1 / 6
    """Probability assigned to translation moves."""
    rotation_prob: float = 1 / 6
    """Probability assigned to rotation moves."""
    reinsertion_prob: float = 1 / 6
    """Probability assigned to reinsertion moves."""
    exchange_prob: float = 1 / 2
    """Probability assigned to exchange moves."""
    seed: int | None = None
    """Random seed. ``None`` uses a time-based seed."""

`exchange_prob = 1 / 2` `class-attribute` `instance-attribute` ¶

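Probability assigned to exchange moves (default 1/2). Note: the source docstring rendered here, "Ordered move sequence for the palindrome propagator.", is stale and does not describe this float field.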

`num_cycles` `instance-attribute` ¶

Number of production cycles.

`num_warmup_cycles` `instance-attribute` ¶

Number of warmup cycles (not written to output).

`out_file` `instance-attribute` ¶

Path to the output HDF5 file.

`seed = None` `class-attribute` `instance-attribute` ¶

Random seed. None uses a time-based seed.

`StressResult` ¶

Bases: NamedTuple

Decomposed stress tensor with potential, tail correction, and ideal gas components.

Source code in src/kups/application/mcmc/data.py

class StressResult(NamedTuple):
    """Decomposed stress tensor with potential, tail correction, and ideal gas components.

    Being a ``NamedTuple``, it unpacks positionally as
    ``(potential, tail_correction, ideal_gas)``.
    """

    # NOTE(review): array shapes and units are not visible from this
    # definition; confirm against the code that produces StressResult.
    potential: Array  # contribution from the interaction potential
    tail_correction: Array  # contribution from the long-range tail correction
    ideal_gas: Array  # ideal-gas contribution

`mcmc_state_from_config(key, host, adsorbates)` ¶

Build per-host MCMC state from ASE Atoms and adsorbate configs.

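Host atoms are not assigned to a molecular group: the host group table is created empty and host particles carry a sentinel group index. Initial adsorbates from host.init_adsorbates are placed randomly within the unit cell. Log fugacity is computed internally via Peng-Robinson EOS; log activity is derived from it.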

Parameters:

Name	Type	Description	Default
`key`	`Array`	JAX PRNG key for random adsorbate placement.	required
`host`	`HostConfig`	Host configuration.	required
`adsorbates`	`tuple[AdsorbateConfig, ...]`	Adsorbate species configurations.	required

Returns:

Type	Description
`tuple[Table[ParticleId, MCMCParticles], Table[GroupId, MCMCGroup], Table[SystemId, MCMCSystems], Table[MotifParticleId, MotifParticles]]`	Tuple of `(particles, groups, system, motifs)`.

Source code in src/kups/application/mcmc/data.py

def mcmc_state_from_config(
    key: Array,
    host: HostConfig,
    adsorbates: tuple[AdsorbateConfig, ...],
) -> tuple[
    Table[ParticleId, MCMCParticles],
    Table[GroupId, MCMCGroup],
    Table[SystemId, MCMCSystems],
    Table[MotifParticleId, MotifParticles],
]:
    """Build per-host MCMC state from a host CIF file and adsorbate configs.

    The host structure is loaded from ``host.cif_file`` and, when
    ``host.cell_replication`` is set, wrapped into the cell and replicated
    into a supercell. Host atoms are not assigned to a molecular group: the
    host group table is created empty and host particles carry a group index
    built with ``n=0``. Initial adsorbates from ``host.init_adsorbates`` are
    created one molecule at a time via ``_make_molecule``, each with its own
    PRNG subkey. Log fugacity is computed internally via Peng-Robinson EOS and
    stored on the system; log activity is available as
    ``MCMCSystems.log_activity``.

    Args:
        key: JAX PRNG key for random adsorbate placement.
        host: Host configuration.
        adsorbates: Adsorbate species configurations.

    Returns:
        Tuple of ``(particles, groups, system, motifs)``.
    """
    hp, cell, _ = particles_from_ase(host.cif_file)
    p = hp.data
    n_host = len(hp.keys)
    if host.cell_replication is not None:
        # Wrap positions into the cell before replicating, then recount the
        # host atoms from the replicated positions.
        pos_lens = lens(lambda x: x.positions, cls=Particles)
        p = pos_lens.apply(p, cell.wrap)
        cell, p = make_supercell(cell, host.cell_replication, p, pos_lens)
        n_host = len(p.positions)
    n_ads = len(adsorbates)

    # Build motifs: concatenate with a MotifId group to assign unique species indices
    ads_particles = [c.as_particles for c in adsorbates]
    motif_ids = [Table((MotifId(0),), jnp.zeros(1)) for _ in ads_particles]
    motifs, _ = Table.union(ads_particles, motif_ids)

    # Compute log fugacity via Peng-Robinson EOS. Inputs are multiplied by the
    # PASCAL / KELVIN constants (presumably unit-conversion factors -- confirm).
    crit_temps = jnp.asarray([a.critical_temperature for a in adsorbates])
    crit_press = jnp.asarray([a.critical_pressure for a in adsorbates])
    acentric = jnp.asarray([a.acentric_factor for a in adsorbates])
    result = peng_robinson_log_fugacity(
        jnp.asarray(float(host.pressure)) * PASCAL,
        jnp.asarray(float(host.temperature)) * KELVIN,
        crit_press * PASCAL,
        crit_temps * KELVIN,
        acentric,
        jnp.asarray(host.adsorbate_composition),
        jnp.asarray(host.adsorbate_interaction),
    )

    # System table: a single system, with a leading axis of length 1 added to
    # the cell and the log fugacity.
    system = Table.arange(
        MCMCSystems(
            cell=cell[None],
            temperature=jnp.array([host.temperature]),
            potential_energy=jnp.zeros(1),
            log_fugacity=result.log_fugacity[None],
        ),
        label=SystemId,
    )
    # Host particles: all belong to system 0. The group and motif indices are
    # built with n=0 (presumably this makes every entry an out-of-range
    # "no group / no motif" sentinel -- confirm against Index.integer).
    host_particles = Table.arange(
        MCMCParticles(
            positions=p.positions,
            masses=p.masses,
            atomic_numbers=p.atomic_numbers,
            charges=p.charges,
            labels=p.labels,
            system=Index.zeros(n_host, label=SystemId),
            group=Index.integer(jnp.zeros(n_host, dtype=int), n=0, label=GroupId),
            motif=Index.integer(
                jnp.zeros(n_host, dtype=int), n=0, label=MotifParticleId
            ),
        ),
        label=ParticleId,
    )
    # Host groups: an empty table (zero-length indices); it only serves as the
    # first operand of the union with the adsorbate groups below.
    host_groups = Table.arange(
        MCMCGroup(
            system=Index.zeros(0, label=SystemId),
            motif=Index.integer(jnp.full(0, n_ads, dtype=int), n=n_ads, label=MotifId),
        ),
        label=GroupId,
    )

    # Place initial adsorbates: one _make_molecule call per requested molecule,
    # splitting the PRNG key each time so every molecule gets a fresh subkey.
    ads_parts: list[Table[ParticleId, MCMCParticles]] = []
    ads_groups: list[Table[GroupId, MCMCGroup]] = []
    for motif_idx, n_init in enumerate(host.init_adsorbates):
        idx = Index.integer(np.array([motif_idx]), label=MotifId)
        for _ in range(n_init):
            key, subkey = jax.random.split(key)
            mol_p, mol_g = _make_molecule(motifs, idx, cell, subkey)
            ads_parts.append(mol_p)
            ads_groups.append(mol_g)

    # Merge host + adsorbate parts
    particles, groups = Table.union(
        [host_particles, *ads_parts], [host_groups, *ads_groups]
    )
    # Store the maximum motif size: overwrite the merged particles' motif keys
    # and group max_count with the motif table's keys and motif max_count.
    particles = bind(
        particles, lambda x: (x.data.motif.keys, x.data.group.max_count)
    ).set((motifs.keys, motifs.data.motif.max_count))
    return particles, groups, system, motifs

kups.application.mcmc.data ¶

AdsorbateConfig ¶

acentric_factor instance-attribute ¶

as_particles property ¶

atomic_numbers = () class-attribute instance-attribute ¶

charges = () class-attribute instance-attribute ¶

critical_pressure instance-attribute ¶

critical_temperature instance-attribute ¶

masses = () class-attribute instance-attribute ¶

positions instance-attribute ¶

symbols instance-attribute ¶

BlockingSphereConfig ¶

center instance-attribute ¶

radius instance-attribute ¶

EwaldCfg ¶

cutoff = 12.0 class-attribute instance-attribute ¶

precision = 1e-06 class-attribute instance-attribute ¶

HostConfig ¶

adsorbate_composition = (1.0,) class-attribute instance-attribute ¶

adsorbate_interaction = ((0.0,),) class-attribute instance-attribute ¶

blocking_spheres = ((),) class-attribute instance-attribute ¶

cell_replication = None class-attribute instance-attribute ¶

cif_file instance-attribute ¶

init_adsorbates = (0,) class-attribute instance-attribute ¶

pressure instance-attribute ¶

temperature instance-attribute ¶

LJConfig ¶

cutoff = 12.0 class-attribute instance-attribute ¶

parameters instance-attribute ¶

tail_correction = True class-attribute instance-attribute ¶

MCMCGroup ¶

labels property ¶

MCMCParticles ¶

exclusion property ¶

inclusion property ¶

MCMCSystems ¶

log_activity property ¶

MotifParticles ¶

RunConfig ¶

exchange_prob = 1 / 2 class-attribute instance-attribute ¶

num_cycles instance-attribute ¶

num_warmup_cycles instance-attribute ¶

out_file instance-attribute ¶

seed = None class-attribute instance-attribute ¶

StressResult ¶

mcmc_state_from_config(key, host, adsorbates) ¶

`kups.application.mcmc.data` ¶

`AdsorbateConfig` ¶

`acentric_factor` `instance-attribute` ¶

`as_particles` `property` ¶

`atomic_numbers = ()` `class-attribute` `instance-attribute` ¶

`charges = ()` `class-attribute` `instance-attribute` ¶

`critical_pressure` `instance-attribute` ¶

`critical_temperature` `instance-attribute` ¶

`masses = ()` `class-attribute` `instance-attribute` ¶

`positions` `instance-attribute` ¶

`symbols` `instance-attribute` ¶

`BlockingSphereConfig` ¶

`center` `instance-attribute` ¶

`radius` `instance-attribute` ¶

`EwaldCfg` ¶

`cutoff = 12.0` `class-attribute` `instance-attribute` ¶

`precision = 1e-06` `class-attribute` `instance-attribute` ¶

`HostConfig` ¶

`adsorbate_composition = (1.0,)` `class-attribute` `instance-attribute` ¶

`adsorbate_interaction = ((0.0,),)` `class-attribute` `instance-attribute` ¶

`blocking_spheres = ((),)` `class-attribute` `instance-attribute` ¶

`cell_replication = None` `class-attribute` `instance-attribute` ¶

`cif_file` `instance-attribute` ¶

`init_adsorbates = (0,)` `class-attribute` `instance-attribute` ¶

`pressure` `instance-attribute` ¶

`temperature` `instance-attribute` ¶

`LJConfig` ¶

`cutoff = 12.0` `class-attribute` `instance-attribute` ¶

`parameters` `instance-attribute` ¶

`tail_correction = True` `class-attribute` `instance-attribute` ¶

`MCMCGroup` ¶

`labels` `property` ¶

`MCMCParticles` ¶

`exclusion` `property` ¶

`inclusion` `property` ¶

`MCMCSystems` ¶

`log_activity` `property` ¶

`MotifParticles` ¶

`RunConfig` ¶

`exchange_prob = 1 / 2` `class-attribute` `instance-attribute` ¶

`num_cycles` `instance-attribute` ¶

`num_warmup_cycles` `instance-attribute` ¶

`out_file` `instance-attribute` ¶

`seed = None` `class-attribute` `instance-attribute` ¶

`StressResult` ¶

`mcmc_state_from_config(key, host, adsorbates)` ¶